diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 47af9bc9f..980f2713a 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -70,6 +70,7 @@ jobs: - name: Build Windows run: | pnpm run build + pnpm run plugin:bundle -- --name feishu --platform win32 --arch ${{ matrix.arch }} pnpm exec electron-builder --win --${{ matrix.arch }} --publish=never env: VITE_GITHUB_CLIENT_ID: ${{ secrets.DC_GITHUB_CLIENT_ID }} @@ -77,6 +78,11 @@ jobs: VITE_GITHUB_REDIRECT_URI: ${{ secrets.DC_GITHUB_REDIRECT_URI }} VITE_PROVIDER_DB_URL: ${{ secrets.CDN_PROVIDER_DB_URL }} + - name: Verify bundled plugins + shell: bash + run: | + pnpm run plugin:verify -- --name feishu --platform win32 --arch ${{ matrix.arch }} --plugin-root dist/win-unpacked/resources/app.asar.unpacked/plugins + - name: Upload artifacts uses: actions/upload-artifact@v6 with: @@ -125,6 +131,7 @@ jobs: - name: Build Linux run: | pnpm run build + pnpm run plugin:bundle -- --name feishu --platform linux --arch ${{ matrix.arch }} pnpm exec electron-builder --linux --${{ matrix.arch }} --publish=never env: VITE_GITHUB_CLIENT_ID: ${{ secrets.DC_GITHUB_CLIENT_ID }} @@ -132,6 +139,11 @@ jobs: VITE_GITHUB_REDIRECT_URI: ${{ secrets.DC_GITHUB_REDIRECT_URI }} VITE_PROVIDER_DB_URL: ${{ secrets.CDN_PROVIDER_DB_URL }} + - name: Verify bundled plugins + shell: bash + run: | + pnpm run plugin:verify -- --name feishu --platform linux --arch ${{ matrix.arch }} --plugin-root dist/linux-unpacked/resources/app.asar.unpacked/plugins + - name: Upload artifacts uses: actions/upload-artifact@v6 with: @@ -188,7 +200,9 @@ jobs: - name: Build Mac run: | pnpm run build - pnpm run plugin:cua:bundle:mac:${{ matrix.arch }} + pnpm run plugin:cua:build:mac:${{ matrix.arch }} + pnpm run plugin:bundle -- --name cua --platform darwin --arch ${{ matrix.arch }} + pnpm run plugin:bundle -- --name feishu --platform darwin --arch ${{ matrix.arch }} pnpm exec electron-builder --mac --${{ matrix.arch }} 
--publish=never env: CSC_LINK: ${{ secrets.DEEPCHAT_CSC_LINK }} @@ -203,19 +217,18 @@ jobs: NODE_OPTIONS: '--max-old-space-size=4096' VITE_PROVIDER_DB_URL: ${{ secrets.CDN_PROVIDER_DB_URL }} - - name: Verify bundled CUA plugin + - name: Verify bundled plugins shell: bash env: TARGET_ARCH: ${{ matrix.arch }} run: | - VERSION="$(node -p "require('./package.json').version")" APP_DIR="dist/mac/DeepChat.app" if [ "$TARGET_ARCH" = "arm64" ]; then APP_DIR="dist/mac-arm64/DeepChat.app" fi - PLUGIN="${APP_DIR}/Contents/Resources/app.asar.unpacked/plugins/deepchat-plugin-cua-${VERSION}-darwin-${TARGET_ARCH}.dcplugin" - test -f "$PLUGIN" - ls -lh "$PLUGIN" + PLUGIN_ROOT="${APP_DIR}/Contents/Resources/app.asar.unpacked/plugins" + pnpm run plugin:verify -- --name cua --platform darwin --arch "$TARGET_ARCH" --plugin-root "$PLUGIN_ROOT" + pnpm run plugin:verify -- --name feishu --platform darwin --arch "$TARGET_ARCH" --plugin-root "$PLUGIN_ROOT" - name: Upload artifacts uses: actions/upload-artifact@v6 diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 153c9266a..6d0495900 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -165,6 +165,7 @@ jobs: - name: Build Windows run: | pnpm run build + pnpm run plugin:bundle -- --name feishu --platform win32 --arch ${{ matrix.arch }} pnpm exec electron-builder --win --${{ matrix.arch }} --publish=never env: GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} @@ -173,6 +174,11 @@ jobs: VITE_GITHUB_REDIRECT_URI: ${{ secrets.DC_GITHUB_REDIRECT_URI }} VITE_PROVIDER_DB_URL: ${{ secrets.CDN_PROVIDER_DB_URL }} + - name: Verify bundled plugins + shell: bash + run: | + pnpm run plugin:verify -- --name feishu --platform win32 --arch ${{ matrix.arch }} --plugin-root dist/win-unpacked/resources/app.asar.unpacked/plugins + - name: Upload artifacts uses: actions/upload-artifact@v6 with: @@ -221,6 +227,7 @@ jobs: - name: Build Linux run: | pnpm run build + pnpm run plugin:bundle -- --name feishu --platform 
linux --arch ${{ matrix.arch }} pnpm exec electron-builder --linux --${{ matrix.arch }} --publish=never env: GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} @@ -229,6 +236,11 @@ jobs: VITE_GITHUB_REDIRECT_URI: ${{ secrets.DC_GITHUB_REDIRECT_URI }} VITE_PROVIDER_DB_URL: ${{ secrets.CDN_PROVIDER_DB_URL }} + - name: Verify bundled plugins + shell: bash + run: | + pnpm run plugin:verify -- --name feishu --platform linux --arch ${{ matrix.arch }} --plugin-root dist/linux-unpacked/resources/app.asar.unpacked/plugins + - name: Upload artifacts uses: actions/upload-artifact@v6 with: @@ -288,7 +300,9 @@ jobs: - name: Build Mac run: | pnpm run build - pnpm run plugin:cua:bundle:mac:${{ matrix.arch }} + pnpm run plugin:cua:build:mac:${{ matrix.arch }} + pnpm run plugin:bundle -- --name cua --platform darwin --arch ${{ matrix.arch }} + pnpm run plugin:bundle -- --name feishu --platform darwin --arch ${{ matrix.arch }} pnpm exec electron-builder --mac --${{ matrix.arch }} --publish=never env: CSC_LINK: ${{ secrets.DEEPCHAT_CSC_LINK }} @@ -304,19 +318,18 @@ jobs: NODE_OPTIONS: '--max-old-space-size=4096' VITE_PROVIDER_DB_URL: ${{ secrets.CDN_PROVIDER_DB_URL }} - - name: Verify bundled CUA plugin + - name: Verify bundled plugins shell: bash env: TARGET_ARCH: ${{ matrix.arch }} run: | - VERSION="$(node -p "require('./package.json').version")" APP_DIR="dist/mac/DeepChat.app" if [ "$TARGET_ARCH" = "arm64" ]; then APP_DIR="dist/mac-arm64/DeepChat.app" fi - PLUGIN="${APP_DIR}/Contents/Resources/app.asar.unpacked/plugins/deepchat-plugin-cua-${VERSION}-darwin-${TARGET_ARCH}.dcplugin" - test -f "$PLUGIN" - ls -lh "$PLUGIN" + PLUGIN_ROOT="${APP_DIR}/Contents/Resources/app.asar.unpacked/plugins" + pnpm run plugin:verify -- --name cua --platform darwin --arch "$TARGET_ARCH" --plugin-root "$PLUGIN_ROOT" + pnpm run plugin:verify -- --name feishu --platform darwin --arch "$TARGET_ARCH" --plugin-root "$PLUGIN_ROOT" - name: Upload artifacts uses: actions/upload-artifact@v6 diff --git a/CHANGELOG.md 
b/CHANGELOG.md index 741d50b41..0cb21b444 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,5 +1,19 @@ # Changelog +## v1.0.5-beta.1 (2026-05-19) +- Added an agent progress todo tool with floating progress UI and plan message rendering so long-running agent work is easier to track +- Added OpenAI-compatible video generation with model settings, generated video message rendering, and provider runtime support +- Improved TTS routing and Gemini TTS behavior with unified model settings, provider metadata, and stronger runtime coverage +- Improved Feishu plugin packaging with platform bundles, release workflow support, and updated packaging documentation +- Updated TypeScript native preview, vue-tsgo, provider registry, and ACP registry data for current tooling and runtime compatibility +- Fixed image-route chat budget handling so generated image requests avoid unnecessary context budget failures +- 新增 Agent 进度 todo 工具、浮动进度界面和计划消息渲染,让长时间 Agent 工作更容易跟踪 +- 新增 OpenAI 兼容的视频生成能力,包含模型设置、生成视频消息渲染和 Provider 运行时支持 +- 优化 TTS 路由和 Gemini TTS 表现,补齐统一模型设置、Provider 元数据和更强的运行时覆盖 +- 优化飞书插件打包,支持平台 bundle、发布 workflow,并更新插件打包文档 +- 更新 TypeScript native preview、vue-tsgo、Provider registry 和 ACP registry 数据,提升当前工具链与运行时兼容性 +- 修复图片路线的聊天预算处理,让生成图片请求避免不必要的上下文预算失败 + ## v1.0.4 (2026-05-15) - Added guided onboarding, voice input transcription, and a redesigned settings control center to make first setup and daily configuration easier - Added agent image generation, OpenAI image settings, Mac computer use, manual compaction, and side panel fullscreen controls for more capable agent workflows diff --git a/docs/features/agent-progress-todo/plan.md b/docs/features/agent-progress-todo/plan.md new file mode 100644 index 000000000..ce7470244 --- /dev/null +++ b/docs/features/agent-progress-todo/plan.md @@ -0,0 +1,175 @@ +# Agent Progress Todo 实施计划 + +## 当前基线 + +- Agent 工具定义由 `AgentToolManager.getAllToolDefinitions()` 汇总,`ToolPresenter` 根据 `disabledAgentTools` 过滤内置工具。 +- 高级工具面板 `McpIndicator.vue` 已按 
`tool.server.name` 对内置工具分组,YoBrowser 通过 `yobrowser` 分区显示和开关。 +- DeepChat agent 执行链路为 `agentRuntimePresenter -> processStream -> dispatch.executeTools -> ToolPresenter.callTool -> AgentToolManager.callTool`。 +- Renderer 实时更新走 `chat.stream.updated` typed event,payload 是完整 assistant blocks snapshot。 +- 当前 shared `@shared/chat` 和 renderer display type 已支持 `plan` block,但 `@shared/types/agent-interface.d.ts` 与 `AssistantMessageBlockSchema` 还未完整纳入 `plan`。 +- ACP 已能把外部 `plan` notification 映射为 `plan` block,但 `MessageBlockPlan.vue` 目前只显示摘要和进度条,不显示完整 checklist。 + +## 架构决策 + +1. `update_plan` 是 DeepChat built-in agent tool,不是 MCP server。 +2. 新工具归入现有 Core 工具分区: + - `server.name = 'agent-core'` + - `function.name = 'update_plan'` + - 这样可直接复用 `disabledAgentTools` 和高级工具面板的单工具开关,不额外增加单工具分区。 +3. `AgentToolManager` 持有 session-scoped `PlanState`,按 `conversationId` 维护 `current/revision/updatedAt`。 +4. 工具调用成功后通过 `AgentToolProgressUpdate` 扩展出 `kind: 'agent_plan'` 把 snapshot 交给 dispatch。 +5. `dispatch.ts` 负责发布 `chat.plan.updated` typed event,不把 DeepChat `update_plan` snapshot 插入当前 assistant message。 +6. `update_plan` tool call block 标记为 internal progress tool,renderer 默认隐藏该 pill,避免重复展示“update_plan 调用完成”。 +7. `chat.plan.updated` event 和 renderer plan store 是 DeepChat todo 的实时来源。若后续需要持久化,应设计独立 progress 存储,不复用 assistant message blocks。 +8. 
MVP 使用可收起浮层,不把 Progress 放入 Workspace 内容区,不增加 sidepanel 顶层 tab。 + +## 数据与类型 + +新增或扩展: + +- `src/shared/types/agent-plan.ts` + - `AgentPlanStepStatus` + - `AgentPlanItem` + - `UpdatePlanArgs` + - `AgentPlanSnapshot` + - `AgentPlanState` +- `src/shared/types/agent-interface.d.ts` + - `AssistantBlockType` 增加 `plan` + - `AssistantMessageExtra` 增加 plan 相关字段类型 +- `src/shared/contracts/common.ts` + - `AssistantMessageBlockSchema.type` 增加 `plan` + - `extra` schema 保持 json record +- `src/shared/contracts/events/chat.events.ts` + - 新增 `chatPlanUpdatedEvent` +- `src/shared/contracts/events.ts` + - 导出并登记新事件 +- `src/shared/types/presenters/tool.presenter.d.ts` + - `AgentToolProgressUpdate` 增加 `agent_plan` variant + +Plan snapshot: + +```ts +interface AgentPlanSnapshot { + sessionId: string + toolCallId?: string + explanation?: string + plan: AgentPlanItem[] + revision: number + updatedAt: string +} +``` + +## Main Process Flow + +```text +Model emits update_plan tool call + -> accumulator adds tool_call block + -> dispatch.executeTools runs ToolPresenter.callTool + -> AgentToolManager validates args and updates PlanState + -> AgentToolManager emits AgentToolProgressUpdate(kind: agent_plan) + -> dispatch marks the update_plan tool call internal and publishes chat.plan.updated + -> renderer receives chat.stream.updated snapshot and chat.plan.updated live event + -> model receives tiny success result +``` + +Implementation pieces: + +- Add `agentPlanTool.ts` under `src/main/presenter/toolPresenter/agentTools/`. +- Add zod schema with `.strict()` objects and max length 12. +- Register tool definition from `AgentToolManager.getAllToolDefinitions()` only in `chatMode === 'agent'`. +- Route `toolName === UPDATE_PLAN_TOOL_NAME` in `AgentToolManager.callTool()`. +- Add helper in `dispatch.ts`: + - `markInternalPlanToolCall(blocks, toolCallId)` + - `publishPlanUpdated(snapshot, messageId)` +- Keep tool output small and context-friendly. 
The tool response to the model should be `{}` or `Plan updated`, not the full plan. + +## Renderer Flow + +- `MessageBlockPlan.vue` + - Replace summary-only rendering with full checklist. + - Support existing ACP `plan_entries` with `{ content, status }` and new DeepChat `{ step, status }`. + - Keep progress count in the header. + - Render empty state when `plan_entries` is empty. + - This component is compatibility UI for ACP/history; DeepChat `update_plan` does not create these blocks. +- New `AgentProgressFloat.vue` + - Input: latest active plan snapshot for current session. + - Collapsed by default. Collapsed state stored in sidepanel/session UI store or local `useStorage` keyed by session id. + - Expands and collapses with a short height/opacity transition. + - Shows only when current active session has a non-empty active plan during generation or a latest settled plan from current turn. +- Chat page integration: + - Subscribe through a small renderer client method for `chat.plan.updated`. + - Maintain `latestPlanBySession` in a small Pinia/composable store. + - Clear active floating plan when a new user turn starts and no plan has arrived yet. +- `MessageItemAssistant.vue` + - Skip rendering internal `update_plan` tool_call blocks by checking `block.extra.internalTool === true` and `block.tool_call.name === 'update_plan'`. + +## Tool Toggle UI + +- `McpIndicator.vue` + - Keep `update_plan` under existing `agent-core` grouping. + - Do not add a separate Progress group or group label. +- Existing `disabledAgentTools` storage works without a schema migration because it stores tool names. +- New sessions inherit agent default `disabledAgentTools`; built-in DeepChat default remains enabled. + +## Prompting + +Update `ToolPresenter.buildToolSystemPrompt()`: + +- Add `buildProgressPrompt(toolNames)`. +- Include rules only when `toolNames.has('update_plan')`. +- Keep this separate from formal planning responses and from question tool rules. 
+ +## Compatibility + +- Existing ACP plan blocks should continue rendering because `MessageBlockPlan` will normalize both `{ content }` and `{ step }`. +- Existing assistant messages with summary-only `plan_entries` still render. +- DeepChat `update_plan` no longer creates new assistant `plan` blocks; this intentionally keeps the message list free of process-state todo items. +- Sessions with `disabledAgentTools` do not need migration. If a user had disabled all tools manually, `update_plan` starts enabled unless agent config later explicitly disables it. +- If `update_plan` is disabled during an active generation, the current request's tool list is not retroactively mutated; the change applies to subsequent tool refreshes, matching existing tool toggle behavior. + +## Test Strategy + +Main tests: + +- `AgentPlanTool` validation rejects unknown status, empty step, extra fields, multiple `in_progress`, and more than 12 steps. +- Valid payload increments revision and normalizes trimmed steps. +- Empty plan clears current snapshot and emits a snapshot with `plan: []`. +- `AgentToolManager` lists `update_plan` in `agent-core` for DeepChat agent mode and omits it when disabled through `ToolPresenter`. +- `ToolPresenter.buildToolSystemPrompt()` includes progress rules only when enabled. +- `dispatch.executeTools` handles `agent_plan` progress update by publishing event and not inserting any `plan` block. + +Renderer tests: + +- `MessageBlockPlan` renders completed / in_progress / pending entries with accessible status text. +- Long step text wraps without changing icon alignment. +- ACP-style `{ content }` plan entries still render. +- Internal `update_plan` tool_call block is hidden. +- `McpIndicator` shows `update_plan` inside Agent Core and toggles it through `disabledAgentTools`. +- Floating panel renders collapsed by default, animates expand/collapse, and ignores stale lower revision updates. 
+ +Validation commands after implementation: + +```bash +pnpm run format +pnpm run i18n +pnpm run lint +pnpm run typecheck +pnpm test -- test/main/presenter/toolPresenter test/main/presenter/agentRuntimePresenter test/renderer/components/message test/renderer/components/McpIndicator.test.ts +``` + +## Risks + +- Tool-call UI noise: hidden internal tool call must be scoped only to `update_plan`, not all agent-core tools. +- Message pollution: DeepChat `update_plan` must not append process-state todo items to assistant message blocks. +- Type drift: there are multiple assistant block type definitions; all active shared/renderer schemas must include `plan`. +- Event ordering: floating panel should compare `revision` and ignore stale updates for the same session. +- Overuse by model: system prompt must explicitly skip simple one-shot tasks. + +## Rollout + +1. Implement tool and validation behind normal tool availability. +2. Add event/block support and renderer checklist. +3. Add floating panel. +4. Expose the `update_plan` toggle inside the existing Agent Core group (no separate Progress group) and add prompt rules. +5. Run tests and validation commands. +6. If floating panel feels intrusive in QA, keep it collapsed by default and retain `MessageBlockPlan` only as ACP/history compatibility UI. 
diff --git a/docs/features/agent-progress-todo/spec.md b/docs/features/agent-progress-todo/spec.md new file mode 100644 index 000000000..c21b22855 --- /dev/null +++ b/docs/features/agent-progress-todo/spec.md @@ -0,0 +1,194 @@ +# Agent Progress Todo 规格 + +## 背景 + +DeepChat agent 已经具备文件、命令、YoBrowser、skills、subagent、提问与权限交互等能力,但缺少一个轻量的“执行进度 / todo”工具。用户在多步骤任务中只能从文本和 tool call pill 推断当前状态,无法稳定看到“已完成、正在做、待处理”。 + +用户提供了 agent-progress-todo 参考文档;核心模型参考 Codex 的 `update_plan`:一次工具调用提交完整 checklist snapshot,runtime 替换当前计划并发出稳定事件,UI 渲染 progress checklist。 + +## 目标 + +- DeepChat agent 可调用 `update_plan` 更新当前任务进度。 +- 用户能在生成过程中看到当前 plan 的 completed / in_progress / pending 状态。 +- `update_plan` 作为内置 agent 核心工具出现,可在 Core 分组中按工具单独启用或停用。 +- checklist 是 agent turn 的过程态,不插入 assistant message 列表;实时展示由独立 plan event/store 驱动。 +- 生成中提供一个可收起的实时 Progress 浮层,避免用户滚动离开最新消息后失去进度可见性。 + +## 用户故事 + +### US-1:多步骤任务可见进度 + +作为用户,当我让 DeepChat agent 执行跨文件或跨阶段任务时,我希望看到已完成、正在处理、待处理的 checklist,而不是只能读 tool call 和中间文本。 + +### US-2:可控的核心工具 + +作为用户,我希望 Progress/Todo 保持在核心工具区域里,不额外增加单工具分区;如果我不希望 agent 展示计划,可以在 Core 分组中停用 `update_plan`。 + +### US-3:消息列表保持干净 + +作为用户,我希望 todo/progress 不被写入聊天消息列表,避免中间状态污染最终回答。即使后续需要持久化,也应进入独立的 progress 存储,而不是 assistant message blocks。 + +### US-4:实时但不打扰 + +作为用户,我希望执行中有一个可收起的 Progress 浮层显示最新进度;如果我不需要看,可以折叠,不影响输入区和消息阅读。 + +## MVP 范围 + +- 新增 DeepChat 内置 agent 工具 `update_plan`。 +- 工具 schema 与参考文档一致:`explanation?: string`,`plan: { step: string; status: "pending" | "in_progress" | "completed" }[]`。 +- 工具校验: + - `plan` 必须为数组,允许空数组用于清空 checklist。 + - `step` trim 后必须为非空字符串。 + - `status` 只允许 `pending | in_progress | completed`。 + - 同一 snapshot 最多一个 `in_progress`。 + - 拒绝额外字段。 + - MVP 最多 12 个 step,超出返回模型可读错误。 +- Runtime 维护 session-scoped latest plan state:`current`、`revision`、`updatedAt`。 +- DeepChat typed event 使用 `chat.plan.updated` 承载参考文档中的 `plan.update` 语义。 +- DeepChat `update_plan` 不新增 assistant `plan` block,也不在消息列表中渲染 todo。 +- 生成中浮层从最新 plan snapshot 渲染,默认收起,支持带动画的展开 / 折叠。 +- 高级工具面板在 
`agent-core` 分区显示 `update_plan`,支持按单个工具停用。 +- Agent system tooling prompt 注入使用规则,避免简单任务滥用 checklist。 +- 覆盖 validation、handler、dispatch/event、UI 渲染、工具分区开关测试。 + +## UX 决策 + +MVP 不重做 Workspace 信息架构,也不把 Progress 作为 Workspace 主内容区的一部分。原因: + +- 当前右侧 sidepanel 已经有 `workspace` 与 `browser` 两个顶层 tab,Workspace 内部又包含 Files、Git、Artifacts。直接塞入实时任务状态会让 Workspace 承担过多职责。 +- Progress 是 agent turn 的执行状态,不是 workspace 文件资产。它应优先跟随 chat generation,而不是跟随文件预览。 +- 用户截图更接近一个轻量 progress panel;可收起浮层能满足实时可见性,同时保持消息列表不被过程态 todo 污染。 + +MVP UI 形态: + +- Message list:DeepChat `update_plan` 不插入 `plan` block;`update_plan` 自身 tool call pill 标记为 internal,默认不渲染。 +- Floating panel:仅当前 session 有 active plan 时显示;desktop 固定在输入区上方右侧,mobile 使用输入区上方全宽紧凑条;默认收起,可动画展开 / 折叠,折叠状态按 session 保存。 +- Tool toggle:在 Advanced Settings -> Built-in Tools 的 Core 分组中显示 `update_plan`。关闭该工具后,本轮之后的工具列表不再暴露该工具。 + +## Tool Contract + +工具名:`update_plan` + +```ts +type AgentPlanStepStatus = 'pending' | 'in_progress' | 'completed' + +interface AgentPlanItem { + step: string + status: AgentPlanStepStatus +} + +interface UpdatePlanArgs { + explanation?: string + plan: AgentPlanItem[] +} +``` + +成功结果应保持极简,推荐: + +```json +{} +``` + +错误结果必须可被模型自修复,例如: + +```text +invalid update_plan arguments: at most one step can be in_progress +``` + +## Event Contract + +Codex 参考文档里的 `plan.update` 在 DeepChat 中落为 typed event: + +```ts +interface ChatPlanUpdatedEvent { + sessionId: string + messageId: string + toolCallId?: string + plan: AgentPlanItem[] + explanation?: string + revision: number + updatedAt: string +} +``` + +语义: + +- 每个事件代表一次完整 snapshot 替换。 +- `revision` 在 session 内单调递增。 +- UI 收到更高 revision 后覆盖当前 checklist。 +- `plan.length === 0` 表示清空 active checklist。 +- 事件用于实时浮层;如后续需要持久化,应写入独立 progress 存储,不复用 assistant message blocks。 + +## Assistant Block Compatibility + +DeepChat `update_plan` 不写入 assistant `plan` block。现有 `plan` block 兼容逻辑仅用于 ACP agent notification 和已有历史消息。 + +兼容的 `plan` block `extra` 存储结构: + +```ts +{ + plan_entries: AgentPlanItem[] 
+ plan_explanation?: string + plan_revision: number + plan_updated_at: string +} +``` + +渲染规则: + +- `explanation` 存在时显示在 checklist 上方一行。 +- `completed` 使用 dimmed style 和 check icon。 +- `in_progress` 使用 active style 和 running indicator。 +- `pending` 使用 normal/muted style 和 hollow circle。 +- 长 step 必须换行,第二行缩进到文本起始位置。 +- screen reader 文本包含本地化后的 status 与 step 文本。 + +## Agent 使用规则 + +注入到工具系统 prompt: + +```text +Use update_plan for non-trivial multi-step tasks. +Skip update_plan for simple one-shot answers or trivial edits. +Keep each plan step short, concrete, and verifiable. +Keep the plan current as work progresses. +At most one step may be in_progress at a time. +When a step completes, update the plan immediately and move the next active step to in_progress in the same call. +Use explanation only when the plan changes materially or when progress would otherwise be unclear. +``` + +## 验收标准 + +- `update_plan` 出现在 DeepChat agent 的内置工具列表中,且 `server.name` 为 `agent-core`。 +- Advanced Settings 的 Built-in Tools 中,`update_plan` 出现在 Core 分组内,可作为单个工具开关。 +- 关闭 `update_plan` 后,新请求工具定义不再包含该工具,系统 prompt 也不再包含 Progress 使用规则。 +- 有效 payload 更新 session plan state,`revision` 递增,`updatedAt` 为 ISO 8601 UTC string。 +- 无效 payload 返回模型可读错误,不更新 state,不发 `chat.plan.updated`。 +- 每次有效调用发出一个 `chat.plan.updated` event,并更新独立 renderer plan store。 +- `update_plan` 不会向当前 assistant message 插入 `plan` block。 +- `update_plan` 自身 tool call pill 不在默认消息视图中制造额外噪声。 +- 浮层默认收起,展开 / 折叠有过渡动画。 +- 浮层能渲染三种状态、长文本换行与空 plan。 +- ACP 或历史 assistant message 的 plan block 仍可正常显示。 +- 测试覆盖 validation、tool handler、dispatch/event、message block、floating panel、tool toggle。 + +## 非目标 + +- 不做 owner、deadline、priority、子任务层级。 +- 不接入外部项目管理系统。 +- 不做长期任务数据库或跨 session 任务看板。 +- 不做自动任务拆解 planner。 +- 不重做 Workspace 顶层布局。 +- 不改变 ACP agent 已有 plan notification 映射,只在必要时复用 UI 组件。 + +## 约束 + +- 遵循 DeepChat 新 renderer-main typed route / typed event 模式,不新增 legacy IPC。 +- 用户可见文案必须走 `src/renderer/src/i18n`。 +- DeepChat agent 新能力优先放在 
`src/main/presenter/toolPresenter/agentTools` 与 `agentRuntimePresenter` 现有链路中。 +- 保持实现轻量,避免引入状态管理系统级复杂度。 +- 不破坏现有 ACP `plan` block 兼容展示。 + +## 开放问题 + +无。 diff --git a/docs/features/agent-progress-todo/tasks.md b/docs/features/agent-progress-todo/tasks.md new file mode 100644 index 000000000..3a2fb3e0a --- /dev/null +++ b/docs/features/agent-progress-todo/tasks.md @@ -0,0 +1,79 @@ +# Agent Progress Todo 任务清单 + +## T0 规格冻结 + +- [x] 阅读 SDD 规范与用户提供的 Codex progress 设计文档。 +- [x] 梳理 DeepChat 当前 agent tool、dispatch、message block、tool toggle、sidepanel/workspace 基线。 +- [x] 明确 MVP UI 决策:聊天内 checklist + 可收起浮层,不重做 Workspace。 +- [x] 移除开放澄清项。 + +## T1 Shared Types 与 Event Contract + +- [x] 新增 `src/shared/types/agent-plan.ts`。 +- [x] 更新 `src/shared/types/agent-interface.d.ts` 的 assistant block 类型与 extra 字段。 +- [x] 更新 `src/shared/contracts/common.ts` 允许 `plan` block。 +- [x] 新增并登记 `chat.plan.updated` typed event。 +- [x] 更新 renderer display type 中 plan extra 的更具体类型。 + +## T2 update_plan 工具与校验 + +- [x] 新增 `src/main/presenter/toolPresenter/agentTools/agentPlanTool.ts`。 +- [x] 定义 `UPDATE_PLAN_TOOL_NAME` 与 zod schema。 +- [x] 实现 strict validation、最多 12 steps、最多一个 `in_progress`。 +- [x] 实现 session-scoped `PlanState` 和 revision 递增。 +- [x] 成功时返回极简 tool result,失败时返回模型可读错误。 +- [x] 添加 main 单测覆盖 validation 和 state 更新。 + +## T3 ToolPresenter 集成与提示词 + +- [x] 在 `AgentToolManager.getAllToolDefinitions()` 注册 `agent-core/update_plan`。 +- [x] 在 `AgentToolManager.callTool()` 路由 `update_plan`。 +- [x] 扩展 `AgentToolProgressUpdate` 支持 `agent_plan`。 +- [x] 在 `ToolPresenter.buildToolSystemPrompt()` 注入 Progress 使用规则。 +- [x] 确认 `disabledAgentTools` 可过滤 `update_plan`。 +- [x] 添加 ToolPresenter/AgentToolManager 单测。 + +## T4 Dispatch 与 Message Block 更新 + +- [x] 在 `dispatch.ts` 处理 `agent_plan` progress update。 +- [x] 不向 current assistant message 插入 `plan` block。 +- [x] 标记 `update_plan` tool_call block 为 internal。 +- [x] 发布 `chat.plan.updated` event。 +- [x] 确保 empty plan 清空 active checklist。 +- [x] 添加 dispatch 单测覆盖 
update 只发 event 且不插入 plan block。 + +## T5 Renderer Checklist + +- [x] 重写 `MessageBlockPlan.vue` 为完整 checklist。 +- [x] 兼容 ACP `{ content, status }` 与 DeepChat `{ step, status }` 两种 entry。 +- [x] 增加 completed / in_progress / pending 三态样式。 +- [x] 增加 empty state 与 screen reader 文本。 +- [x] 在 `MessageItemAssistant.vue` 隐藏 internal `update_plan` tool call。 +- [x] 添加 renderer 组件测试。 + +## T6 Floating Progress Panel + +- [x] 新增 `AgentProgressFloat.vue`。 +- [x] 新增或扩展 renderer store/composable 维护 latest plan snapshot。 +- [x] 订阅 `chat.plan.updated`,按 session 和 revision 去重。 +- [x] 在 `ChatPage.vue` 输入区上方挂载浮层。 +- [x] 支持 per-session collapsed state,默认收起。 +- [x] 增加展开 / 收起动画。 +- [x] 添加浮层渲染与折叠测试。 + +## T7 工具分区开关与 i18n + +- [x] 确认 `update_plan` 出现在现有 Agent Core 分组中。 +- [x] 不新增单独 Progress 分组或分组 i18n 文案。 +- [x] 确认草稿会话和已有 session 都能开关 `update_plan`。 +- [x] 更新 DeepChat agent settings 工具列表展示需要的分组标签。 +- [x] 添加 `McpIndicator` 测试覆盖 Core 内单工具 toggle。 + +## T8 验证 + +- [x] 运行 `pnpm run format`。 +- [x] 运行 `pnpm run i18n`。 +- [x] 运行 `pnpm run lint`。 +- [x] 运行 `pnpm run typecheck`。 +- [x] 运行相关 main/renderer 测试。 +- [ ] 手动验证一个多步骤 agent 任务能显示、更新、完成和隐藏 progress。 diff --git a/docs/features/openai-compatible-video-generation/plan.md b/docs/features/openai-compatible-video-generation/plan.md new file mode 100644 index 000000000..37b2c5b4f --- /dev/null +++ b/docs/features/openai-compatible-video-generation/plan.md @@ -0,0 +1,42 @@ +# Plan + +## Approach +Treat video generation as a first-class model capability parallel to image generation and TTS: +- Extend shared model/type enums and model-db parsing to include `videoGeneration`. +- Add a shared video compatibility helper that can recover video intent from model metadata, endpoint hints, modalities, or known model ID patterns when upstream data is incomplete. +- Add an OpenAI-compatible video runtime path that sends requests to `/v1/videos`, normalizes provider responses, and emits media output into the assistant stream. 
+- Reuse the current assistant media block transport by carrying video payloads through the existing message block structure with video MIME detection on the renderer side. + +## Affected Areas +- Shared types/contracts: + - `src/shared/model.ts` + - `src/shared/types/model-db.ts` + - `src/shared/types/presenters/llmprovider.presenter.d.ts` + - `src/shared/types/presenters/legacy.presenters.d.ts` + - `src/shared/videoGenerationSettings.ts` (new) +- Main runtime/provider: + - `src/main/presenter/configPresenter/index.ts` + - `src/main/presenter/configPresenter/modelConfig.ts` + - `src/main/presenter/llmProviderPresenter/index.ts` + - `src/main/presenter/llmProviderPresenter/providers/aiSdkProvider.ts` + - `src/main/presenter/llmProviderPresenter/aiSdk/runtime.ts` +- Renderer: + - `src/renderer/src/composables/useModelTypeDetection.ts` + - `src/renderer/src/components/chat/messageListItems.ts` + - `src/renderer/src/components/message/MessageItemAssistant.vue` + - `src/renderer/src/components/message/MessageBlockVideo.vue` (new) + - `src/renderer/settings/components/ProviderModelList.vue` +- Model DB: + - `resources/model-db/providers.json` + +## Compatibility +- Existing text, image, and TTS paths remain unchanged. +- Existing assistant block persistence remains compatible by reusing the current media payload field rather than changing the storage shape. +- Future video models can plug in through shared detection helpers or explicit `videoGeneration` metadata. 
+ +## Verification Strategy +Run: +- `pnpm run typecheck` +- `pnpm run format` +- `pnpm run i18n` +- `pnpm run lint` diff --git a/docs/features/openai-compatible-video-generation/spec.md b/docs/features/openai-compatible-video-generation/spec.md new file mode 100644 index 000000000..66550c902 --- /dev/null +++ b/docs/features/openai-compatible-video-generation/spec.md @@ -0,0 +1,32 @@ +# OpenAI-Compatible Video Generation + +## User Need +Users need DeepChat to recognize and run video generation models such as `doubao-seedance-2-0-fast-260128` through the same model-driven provider flow used by text and audio generation, without hardcoding one-off provider logic for each future video model. + +## Goal +Enable first-class video generation routing in DeepChat for OpenAI-compatible providers, starting with AIHubMix Seedance models and leaving a compatibility layer for future video models. + +## Acceptance Criteria +1. Shared model/type contracts support `videoGeneration` and preserve compatibility with existing model metadata. +2. DeepChat can recognize `doubao-seedance-2-0-fast-260128` as a video generation model even when upstream metadata is incomplete or still marked as `chat`. +3. Main runtime can route video generation requests through an OpenAI-compatible `/v1/videos` flow. +4. Video generation responses are normalized into a stable internal result shape that future providers/models can reuse. +5. Generated video output reaches the existing assistant message pipeline and renders in the chat UI. +6. Validation commands pass: +- `pnpm run typecheck` +- `pnpm run format` +- `pnpm run i18n` +- `pnpm run lint` + +## Constraints +- Keep the provider integration generic for OpenAI-compatible video endpoints. +- Reuse the current assistant media block pipeline where practical instead of introducing a parallel storage format. +- Do not scope in advanced video editing controls or provider-specific parameter UIs for this change. 
+ +## Non-Goals +- Dedicated video generation settings panels. +- Agent-level video generation tool configuration. +- Non-OpenAI-compatible video provider protocols. + +## Open Questions +- None for current scope. diff --git a/docs/features/openai-compatible-video-generation/tasks.md b/docs/features/openai-compatible-video-generation/tasks.md new file mode 100644 index 000000000..d27f8ab8f --- /dev/null +++ b/docs/features/openai-compatible-video-generation/tasks.md @@ -0,0 +1,25 @@ +# Tasks + +## Shared Types + Detection +- [x] Add `ModelType.VideoGeneration` and extend model-db parsing/schema for `videoGeneration`. +- [x] Add shared video detection/compatibility helpers for endpoint hints, modalities, and known model IDs. +- [x] Update model config inference to classify video models consistently in main and renderer flows. +- [x] Extend session generation settings/contracts and draft state to carry `videoGeneration` options. + +## Runtime + Provider +- [x] Add `generateVideoStandalone` presenter contracts and implementation. +- [x] Add OpenAI-compatible `/v1/videos` request/response normalization in the AI SDK runtime/provider path. +- [x] Persist and sanitize session-level video generation settings through agent runtime and sqlite storage. +- [ ] Mark Seedance built-in model metadata as `videoGeneration` where available. + +## Renderer +- [x] Expose video model detection for UI behavior alignment. +- [x] Add assistant message rendering for generated video media. +- [x] Update model list/type display for video generation models. +- [x] Expose video generation settings in chat status bar and model config dialog flows. + +## Validation +- [x] Run `pnpm run typecheck`. +- [x] Run `pnpm run format`. +- [x] Run `pnpm run i18n`. +- [x] Run `pnpm run lint`. 
diff --git a/docs/features/unified-tts-provider/plan.md b/docs/features/unified-tts-provider/plan.md new file mode 100644 index 000000000..2d6f02b05 --- /dev/null +++ b/docs/features/unified-tts-provider/plan.md @@ -0,0 +1,37 @@ +# Plan + +## Approach +Treat TTS as a first-class model capability and follow the `ImageGeneration` routing strategy: +- Extend shared model/type schema to include `tts`. +- Add runtime TTS routing ahead of default chat generation. +- Dispatch by model pattern: + - Pattern A: `/v1/audio/speech` + - Pattern B: `/v1/chat/completions` with `audio` output +- Normalize returned audio into data URL and cache through existing device cache, then emit `image_data` with audio MIME type. + +## Affected Areas +- Shared types/contracts: + - `src/shared/model.ts` + - `src/shared/types/model-db.ts` + - `src/shared/types/presenters/legacy.presenters.d.ts` + - `src/shared/contracts/common.ts` + - `src/shared/contracts/domainSchemas.ts` + - `src/shared/ttsSettings.ts` (new) +- Main runtime/provider: + - `src/main/presenter/llmProviderPresenter/aiSdk/runtime.ts` + - `src/main/presenter/llmProviderPresenter/providers/aiSdkProvider.ts` +- Model DB: + - `resources/model-db/providers.json` +- Renderer model type detection: + - `src/renderer/src/composables/useModelTypeDetection.ts` + +## Compatibility +- Existing chat and image generation paths remain unchanged. +- Existing renderer audio playback remains unchanged because it already handles `image_data` with `audio/*` MIME. 
+ +## Verification Strategy +Run: +- `pnpm run typecheck` +- `pnpm run format` +- `pnpm run i18n` +- `pnpm run lint` diff --git a/docs/features/unified-tts-provider/spec.md b/docs/features/unified-tts-provider/spec.md new file mode 100644 index 000000000..beba05f9f --- /dev/null +++ b/docs/features/unified-tts-provider/spec.md @@ -0,0 +1,34 @@ +# Unified TTS Provider (Model-Level) + +## User Need +Users want TTS integrated as a model capability (`ModelType.TTS`) instead of per-provider custom integration, so any OpenAI-compatible provider can work if its model metadata marks TTS support. + +## Goal +Enable model-level TTS routing in DeepChat similar to image generation routing, including: +- Standard OpenAI `/v1/audio/speech` TTS models +- Chat-completions-audio TTS models that return base64 audio + +## Acceptance Criteria +1. `ModelType.TTS` is available in shared model contracts and model-db schema. +2. Runtime can route TTS models by model capability metadata and endpoint hints. +3. Runtime supports both TTS patterns and emits `image_data` events with `audio/*` MIME type for existing renderer playback. +4. Model DB can represent TTS model type for built-in provider entries. +5. Frontend model type detection exposes TTS model state for UI behavior alignment. +6. Validation commands pass: +- `pnpm run typecheck` +- `pnpm run format` +- `pnpm run i18n` +- `pnpm run lint` + +## Constraints +- Reuse existing audio rendering path via `image_data`; avoid introducing new stream event types. +- Keep provider integration generic for OpenAI-compatible providers. +- Do not introduce dedicated UI for TTS settings in this scope. + +## Non-Goals +- New TTS player UI. +- Voice catalog fetching UX. +- VoiceAI provider refactor. + +## Open Questions +- None for current scope. 
diff --git a/docs/features/unified-tts-provider/tasks.md b/docs/features/unified-tts-provider/tasks.md new file mode 100644 index 000000000..10e2e1cb3 --- /dev/null +++ b/docs/features/unified-tts-provider/tasks.md @@ -0,0 +1,22 @@ +# Tasks + +## Shared Types + Runtime +- [x] Add `ModelType.TTS` and `ApiEndpointType.AudioSpeech` in shared model enums. +- [x] Extend model-db schema and parser for `tts` type. +- [x] Add `src/shared/ttsSettings.ts` helpers for pattern detection and format normalization. +- [x] Extend presenter model config contracts with optional `tts` settings. +- [x] Add TTS route in runtime supporting pattern A and pattern B. +- [x] Inject `shouldUseTts` capability check from AI SDK provider. + +## Model DB +- [x] Mark relevant `aihubmix` models as `type: "tts"` in provider model list. +- [x] Evaluate whether built-in `xiaomimimo` provider entry exists; it does not, so built-in DB coverage is skipped. + +## Renderer +- [x] Extend `useModelTypeDetection` to include `tts` and expose `isTtsModel`. + +## Validation +- [x] Run `pnpm run typecheck`. +- [x] Run `pnpm run format`. +- [x] Run `pnpm run i18n`. +- [x] Run `pnpm run lint`. diff --git a/docs/features/v1-0-5-beta-1-release/plan.md b/docs/features/v1-0-5-beta-1-release/plan.md new file mode 100644 index 000000000..d476c9d54 --- /dev/null +++ b/docs/features/v1-0-5-beta-1-release/plan.md @@ -0,0 +1,22 @@ +# v1.0.5 Beta 1 Release Plan + +## Release Metadata + +- Update `package.json` from `1.0.4` to `1.0.5-beta.1`. +- Add the `v1.0.5-beta.1` changelog section dated `2026-05-19`. +- Derive release notes from commits after `v1.0.4`. + +## Validation + +- Run `pnpm run format`. +- Run `pnpm run i18n`. +- Run `pnpm run lint`. +- Run `pnpm run typecheck` before cutting the release branch. + +## Publishing + +- Commit the metadata on `dev`. +- Push `dev`. +- Cut `release/v1.0.5-beta.1` from the release-ready `dev` commit. +- Open the release PR to `main` for review and CI. 
+- Fast-forward `main`, tag `v1.0.5-beta.1`, and clean up the release branch after PR approval. diff --git a/docs/features/v1-0-5-beta-1-release/spec.md b/docs/features/v1-0-5-beta-1-release/spec.md new file mode 100644 index 000000000..092d768f5 --- /dev/null +++ b/docs/features/v1-0-5-beta-1-release/spec.md @@ -0,0 +1,22 @@ +# v1.0.5 Beta 1 Release Spec + +## User Story + +As a DeepChat maintainer, I want to publish `v1.0.5-beta.1` so beta users can try the accumulated changes after the `v1.0.4` stable release. + +## Acceptance Criteria + +- The root package version is `1.0.5-beta.1`. +- `CHANGELOG.md` contains a top-level `v1.0.5-beta.1 (2026-05-19)` section. +- Release notes summarize user-visible and release-relevant changes since `v1.0.4`. +- The release branch and tag use `release/v1.0.5-beta.1` and `v1.0.5-beta.1`. + +## Non-Goals + +- No product behavior changes are introduced as part of the release metadata update. +- No historical changelog sections are rewritten. + +## Constraints + +- Follow the repository release flow with `dev` as the integration branch and `main` updated by fast-forward. +- Keep changelog entries bilingual with English bullets before Chinese bullets. diff --git a/docs/features/v1-0-5-beta-1-release/tasks.md b/docs/features/v1-0-5-beta-1-release/tasks.md new file mode 100644 index 000000000..15fba38a6 --- /dev/null +++ b/docs/features/v1-0-5-beta-1-release/tasks.md @@ -0,0 +1,9 @@ +# v1.0.5 Beta 1 Release Tasks + +- [x] Confirm current branch, working tree, release branch, and tag state. +- [x] Update package version and changelog. +- [x] Run format, i18n, lint, and typecheck checks. +- [ ] Commit and push release metadata on `dev`. +- [ ] Cut and push `release/v1.0.5-beta.1`. +- [ ] Open the release PR to `main`. +- [ ] Fast-forward `main`, tag `v1.0.5-beta.1`, and clean up the release branch after approval. 
diff --git a/docs/guides/plugin-packaging.md b/docs/guides/plugin-packaging.md index ea3864127..8c5a40502 100644 --- a/docs/guides/plugin-packaging.md +++ b/docs/guides/plugin-packaging.md @@ -23,97 +23,150 @@ Official packages keep DeepChat release asset URLs in their manifest metadata: https://github.com/ThinkInAIXYZ/deepchat/releases/download/v<version>/<package-name>.dcplugin ``` -## CUA Plugin Artifacts +Output naming pattern: `deepchat-plugin-<name>-<version>[-<platform>-<arch>].dcplugin` -The CUA plugin ships one macOS helper app per CPU architecture. The bundled package filename -includes both platform and architecture: +## Generic Commands -```text -deepchat-plugin-cua-<version>-darwin-arm64.dcplugin -deepchat-plugin-cua-<version>-darwin-x64.dcplugin -``` +All plugins share a common set of commands powered by `scripts/plugin.mjs`, which delegates to +`scripts/package-plugin.mjs` for the actual packaging logic. -The manifest inside each package keeps the official DeepChat release-download namespace for trust -metadata. Runtime detection inside the package uses the same architecture-specific plugin path: +### Validate -```text -plugin:runtime/darwin/<arch>/DeepChat Computer Use.app/Contents/MacOS/cua-driver +Dry-run: validates the manifest and file references without producing a `.dcplugin`. + +```bash +pnpm run plugin:validate -- --name <name> --platform <platform> --arch <arch> ``` -Architecture mapping: +### Package -| DeepChat arch | Swift arch | Runtime directory | -| --- | --- | --- | -| `arm64` | `arm64` | `runtime/darwin/arm64/` | -| `x64` | `x86_64` | `runtime/darwin/x64/` | +Build (if the plugin has a native build step) and package into a `.dcplugin` under `dist/plugins/`. -Each `.dcplugin` contains only the runtime directory for its target architecture. +```bash +pnpm run plugin:package -- --name <name> --platform <platform> --arch <arch> +``` -## Local Commands +### Bundle -Validate the package metadata for the current host architecture: +Package into `build/bundled-plugins/` for embedding into the Electron app.
```bash -pnpm run plugin:cua:validate +pnpm run plugin:bundle -- --name <name> --platform <platform> --arch <arch> ``` -Build and package the current host architecture: +### Verify + +Verify expected bundled official plugin artifacts from plugin metadata. ```bash -pnpm run plugin:cua:package +pnpm run plugin:verify -- --name <name> --platform <platform> --arch <arch> --plugin-root <path> ``` -Build and package explicit macOS architectures: +When `--name` is omitted, the script verifies all official plugins supported by the target platform. + +### Clean + +Remove all bundled plugin artifacts: ```bash -pnpm run plugin:cua:package:mac:arm64 -pnpm run plugin:cua:package:mac:x64 +pnpm run plugin:bundle:clean ``` -Build the package that will be embedded into the macOS app: +## Plugins with Native Build Steps + +Some plugins (like CUA) include pre-compiled native binaries. These require an additional build +step before packaging. The dispatcher script automatically detects and runs +`scripts/build-<name>-plugin-runtime.mjs` when it exists. + +CUA native build commands (macOS-only, requires Swift toolchain): ```bash -pnpm run plugin:cua:bundle:mac:arm64 -pnpm run plugin:cua:bundle:mac:x64 +pnpm run plugin:cua:build # host architecture +pnpm run plugin:cua:build:mac:arm64 # explicit ARM64 +pnpm run plugin:cua:build:mac:x64 # explicit x64 ``` -Validate explicit macOS architectures after their helper runtimes have been staged: +## CUA Plugin Artifacts -```bash -pnpm run plugin:cua:validate:mac:arm64 -pnpm run plugin:cua:validate:mac:x64 +The CUA plugin ships one macOS helper app per CPU architecture. The bundled package filename +includes both platform and architecture: + +```text +deepchat-plugin-cua-<version>-darwin-arm64.dcplugin +deepchat-plugin-cua-<version>-darwin-x64.dcplugin +``` + +Runtime detection inside the package uses architecture-specific paths: + +```text +plugin:runtime/darwin/<arch>/DeepChat Computer Use.app/Contents/MacOS/cua-driver +``` + +Each `.dcplugin` contains only the runtime directory for its target architecture.
+ +## Feishu Plugin Artifacts + +The feishu plugin targets all platforms (darwin, linux, win32). Its MCP server uses +`node serve.mjs`, which calls `npx` at runtime to download the `@larksuiteoapi/lark-mcp` +package on first use. + +```text +deepchat-plugin-feishu-<version>-darwin-arm64.dcplugin +deepchat-plugin-feishu-<version>-darwin-x64.dcplugin +deepchat-plugin-feishu-<version>-linux-x64.dcplugin +deepchat-plugin-feishu-<version>-win32-x64.dcplugin ``` -Standalone packages are written to: +## Output Locations + +Standalone packages: ```text dist/plugins/ ``` -Bundled packages are written to: +Bundled packages (embedded into the Electron app): ```text build/bundled-plugins/ ``` -## CI And Release +## CI and Release + +The build matrix in `.github/workflows/build.yml` bundles plugins before running `electron-builder` +on every platform: + +- **macOS**: bundles both CUA (with native build) and feishu plugins. +- **Linux**: bundles feishu plugin only (CUA is macOS-only). +- **Windows**: bundles feishu plugin only. -The macOS build matrix in `.github/workflows/build.yml` builds the matching CUA plugin bundle before -running `electron-builder`. Electron Builder embeds it into: +Electron Builder embeds `.dcplugin` files from `build/bundled-plugins/` into: ```text -DeepChat.app/Contents/Resources/app.asar.unpacked/plugins/ +<app>/Contents/Resources/app.asar.unpacked/plugins/ (macOS) +<app>/resources/app.asar.unpacked/plugins/ (Windows/Linux) ``` -Each matrix job verifies the expected bundled `.dcplugin` exists inside the app before uploading -artifacts. +Each matrix job verifies the expected bundled `.dcplugin` files exist inside the app before +uploading artifacts. -The release workflow repeats the same bundled package step. The final release uploads app artifacts -only; `.dcplugin` files are not published as separate GitHub Release assets. +The release workflow (`.github/workflows/release.yml`) repeats the same steps.
The final release +uploads app artifacts only; `.dcplugin` files are not published as separate GitHub Release assets. -Expected embedded files: +Expected embedded files (macOS example): ```text app.asar.unpacked/plugins/deepchat-plugin-cua-<version>-darwin-x64.dcplugin app.asar.unpacked/plugins/deepchat-plugin-cua-<version>-darwin-arm64.dcplugin +app.asar.unpacked/plugins/deepchat-plugin-feishu-<version>-darwin-x64.dcplugin +app.asar.unpacked/plugins/deepchat-plugin-feishu-<version>-darwin-arm64.dcplugin ``` + +## Adding a New Plugin + +1. Create `plugins/<name>/plugin.json` with required fields (`id`, `name`, `version`, `publisher`, + `source`, `engines.platforms`, skills, settings contributions). +2. If the plugin needs a native build step, create `scripts/build-<name>-plugin-runtime.mjs`. +3. Test locally: `pnpm run plugin:validate -- --name <name> --platform <platform> --arch <arch>` +4. Add bundling commands to the CI workflows for the relevant platforms. +5. Add verification steps to CI to confirm the `.dcplugin` is embedded in the built app. diff --git a/docs/issues/assistant-action-type-null-renderer-crash/plan.md b/docs/issues/assistant-action-type-null-renderer-crash/plan.md new file mode 100644 index 000000000..d564ab21a --- /dev/null +++ b/docs/issues/assistant-action-type-null-renderer-crash/plan.md @@ -0,0 +1,14 @@ +# Assistant `action_type` Null Renderer Crash Plan + +## Approach + +- Normalize persisted action types inside `DeepChatMessageStore` while converting `DeepChatAssistantBlockRow` rows into `AssistantMessageBlock` objects. +- Return only `tool_call_permission`, `question_request`, or `rate_limit`; treat `null` and unknown strings as absent. +- Build the hydrated block with conditional spreading so omitted action types are not serialized as `null` or `undefined`. +- Keep `AssistantMessageBlockSchema` unchanged to preserve route/event validation. + +## Tests + +- Extend `messageStore` tests to materialize assistant rows containing nullable content/tool blocks and assert the resulting JSON omits `action_type`.
+- Add a mixed persisted-block regression where an unknown value is omitted and a valid action block is retained. +- Pass hydrated blocks through `cloneBlocksForRenderer()` to verify the renderer snapshot contract accepts them. diff --git a/docs/issues/assistant-action-type-null-renderer-crash/spec.md b/docs/issues/assistant-action-type-null-renderer-crash/spec.md new file mode 100644 index 000000000..b090c10af --- /dev/null +++ b/docs/issues/assistant-action-type-null-renderer-crash/spec.md @@ -0,0 +1,24 @@ +# Assistant `action_type` Null Renderer Crash + +## Problem + +Resuming a tool interaction can reload assistant message blocks from the normalized SQLite table. That table stores `action_type` as nullable text, and hydrated non-action blocks currently carry `action_type: null` into runtime message content. Renderer flushes then validate the block array with `AssistantMessageBlockSchema`, which allows an omitted `action_type` but rejects `null`, causing stream finalization and tool-interaction routes to fail. + +## Goals + +- Keep nullable `action_type` as a storage detail only. +- Materialize assistant blocks with `action_type` omitted unless the persisted value is a supported renderer action type. +- Preserve the strict renderer/event contract so invalid message shapes are still rejected before publication. + +## Non-Goals + +- No schema migration for `deepchat_assistant_blocks`. +- No IPC, route, renderer component, or public type changes. +- No behavior change for valid `tool_call_permission`, `question_request`, or `rate_limit` blocks. + +## Acceptance Criteria + +- Hydrated content/tool blocks with `action_type = NULL` do not include an `action_type` property. +- Hydrated rows with unknown `action_type` values omit the property instead of crashing renderer publication. +- Valid persisted action blocks keep their action type. +- Regression tests cover hydration and renderer cloning for the affected shapes. 
diff --git a/docs/issues/assistant-action-type-null-renderer-crash/tasks.md b/docs/issues/assistant-action-type-null-renderer-crash/tasks.md new file mode 100644 index 000000000..fd0ff40cc --- /dev/null +++ b/docs/issues/assistant-action-type-null-renderer-crash/tasks.md @@ -0,0 +1,6 @@ +# Assistant `action_type` Null Renderer Crash Tasks + +- [x] Document the issue spec, implementation plan, and task list. +- [x] Normalize persisted `action_type` values during assistant block hydration. +- [x] Add regression tests for nullable and unknown persisted action types. +- [x] Run targeted tests and final repository gates. diff --git a/docs/issues/image-generation-context-budget-bypass/plan.md b/docs/issues/image-generation-context-budget-bypass/plan.md new file mode 100644 index 000000000..8557e630b --- /dev/null +++ b/docs/issues/image-generation-context-budget-bypass/plan.md @@ -0,0 +1,24 @@ +# Image Generation Context Budget Bypass Plan + +## Approach + +- Add a model-aware Agent runtime helper that returns true only when DeepChat should use its chat + context budget. +- Keep ACP bypass behavior, and also bypass when the model config explicitly identifies + `ImageGeneration`, `TTS`, a non-chat API endpoint, or `endpointType === 'image-generation'`. +- Treat missing legacy model metadata as chat-compatible. + +## Runtime Changes + +- Use the helper in new user turns and resume/retry context construction before deciding whether to + compact, trim, or use a finite chat context length. +- Use the helper inside the provider-call wrapper before running preflight/recovery or shrinking the + per-call `maxTokens`. +- Leave `contextBudget.ts`, public contracts, IPC, and renderer code unchanged. + +## Test Strategy + +- Add an Agent runtime regression for an image endpoint request that would fail chat-budget + preflight, asserting the provider is still called and max tokens are preserved. +- Keep chat-model pressure tests verifying the existing budget preflight path still runs. 
+- Run the targeted Agent runtime/context budget tests plus repository format, i18n, and lint checks. diff --git a/docs/issues/image-generation-context-budget-bypass/spec.md b/docs/issues/image-generation-context-budget-bypass/spec.md new file mode 100644 index 000000000..cc61002f3 --- /dev/null +++ b/docs/issues/image-generation-context-budget-bypass/spec.md @@ -0,0 +1,41 @@ +# Image Generation Context Budget Bypass Spec + +> Status: Draft +> Date: 2026-05-18 + +## Background + +DeepChat Agent applies a chat-oriented provider-call context preflight before sending model +requests. The check estimates message tokens, tool schemas, and output tokens, then blocks requests +that cannot fit inside the configured model context window. + +That check is valid for chat models, but image generation and other non-chat routes do not use the +same request shape. Image requests can therefore fail before reaching the provider with: + +`Request was not sent because it cannot fit within the model context window after applying the safety margin.` + +## Goals + +- Only apply DeepChat's chat context budget to chat model requests. +- Skip the chat budget preflight, compaction recovery, and temporary max-token shrink for explicit + image generation and other non-chat model routes. +- Preserve current behavior for chat models and ACP provider bypasses. + +## Acceptance Criteria + +- Image generation models or image endpoints reach the provider even when chat-budget estimation + would fail. +- Non-chat requests do not trigger the DeepChat context-pressure compaction path solely because of + chat message/tool-schema estimates. +- Non-chat request max tokens are not reduced by the chat preflight safety margin. +- Chat models keep the existing preflight, recovery, and overflow failure behavior. +- Existing legacy model configs without explicit type or endpoint metadata continue to be treated as + chat requests. +- No public API, IPC, schema, or renderer UI changes are introduced. 
+ +## Non-Goals + +- Redesign image generation request construction. +- Change the agent image generation tool behavior for chat models. +- Change `contextBudget.ts` budgeting math. +- Add renderer UI for non-chat routing diagnostics. diff --git a/docs/issues/image-generation-context-budget-bypass/tasks.md b/docs/issues/image-generation-context-budget-bypass/tasks.md new file mode 100644 index 000000000..727a38d9b --- /dev/null +++ b/docs/issues/image-generation-context-budget-bypass/tasks.md @@ -0,0 +1,7 @@ +# Image Generation Context Budget Bypass Tasks + +- [x] Document the issue and intended behavior. +- [x] Add model-aware chat budget gating in the Agent runtime. +- [x] Add regression coverage for image endpoint bypass. +- [x] Verify chat context budget behavior remains unchanged. +- [x] Run targeted tests and repository quality checks. diff --git a/docs/issues/merge-dev-into-gen-video/plan.md b/docs/issues/merge-dev-into-gen-video/plan.md new file mode 100644 index 000000000..caf4ddd68 --- /dev/null +++ b/docs/issues/merge-dev-into-gen-video/plan.md @@ -0,0 +1,20 @@ +# Plan + +## Scope +将 `origin/dev` 合并到当前 `gen-video` 分支,识别并解决冲突文件,保留双方必要改动,并执行仓库要求的基础校验。 + +## Implementation decisions +- 先 `git fetch origin dev`,再执行 `git merge origin/dev` 以基于最新远端 `dev` 合并。 +- 冲突解决前先阅读每个冲突文件的上下文,按文件现有模式做最小修改。 +- 若冲突涉及文档或配置,同样遵循最小差异原则,不借机整理无关内容。 +- 合并完成后执行仓库要求的 `pnpm run format`、`pnpm run i18n`、`pnpm run lint`。若命令失败,记录失败点并告知用户。 + +## Risks and mitigations +- 风险:冲突文件较多且分散,容易误删一侧逻辑。 + - 缓解:逐文件阅读冲突块上下文后再编辑,并在完成后检查 diff。 +- 风险:格式化或 lint 暴露既有问题,影响本次验证。 + - 缓解:优先区分新引入问题与仓库既有问题,向用户明确说明。 + +## Test strategy +- 使用 `git status` 确认冲突已清除。 +- 使用格式化、i18n、lint 命令验证合并后仓库状态。 diff --git a/docs/issues/merge-dev-into-gen-video/spec.md b/docs/issues/merge-dev-into-gen-video/spec.md new file mode 100644 index 000000000..825557004 --- /dev/null +++ b/docs/issues/merge-dev-into-gen-video/spec.md @@ -0,0 +1,23 @@ +# Merge dev into gen-video + +## User stories +- 作为 `gen-video` 分支开发者,我需要合并最新 `dev` 
变更到当前分支,以便继续在最新主线基础上开发。 +- 作为评审者,我需要本次冲突解决范围清晰、仅限必要文件,并保留两侧已完成的有效修改。 + +## Acceptance criteria +- 当前分支成功合并 `origin/dev`,不存在未解决的 merge conflict。 +- 冲突文件采用最小变更原则解决,不引入与本次合并无关的重构。 +- 合并后工作区状态可继续提交,且相关校验命令已执行并记录结果。 + +## Non-goals +- 不在本次任务中实现新的产品功能。 +- 不主动修改与冲突无关的历史代码风格。 +- 不提交 commit,除非用户额外要求。 + +## Constraints +- 仅处理 `dev` 合并到当前 `gen-video` 分支产生的冲突。 +- 遵循仓库现有 SDD、格式化、i18n、lint 规范。 +- 如需保留双方逻辑,优先基于现有实现做兼容合并,而非重写。 + +## Open questions +- 无 diff --git a/docs/issues/merge-dev-into-gen-video/tasks.md b/docs/issues/merge-dev-into-gen-video/tasks.md new file mode 100644 index 000000000..f234a30a5 --- /dev/null +++ b/docs/issues/merge-dev-into-gen-video/tasks.md @@ -0,0 +1,8 @@ +# Tasks + +1. 获取最新 `origin/dev` 并确认当前分支状态。 +2. 创建本次合并的 SDD 文档并记录范围、约束、验证方式。 +3. 执行 `git merge origin/dev`,定位所有冲突文件。 +4. 阅读冲突文件上下文,逐个解决冲突并保留必要改动。 +5. 运行 `pnpm run format`、`pnpm run i18n`、`pnpm run lint`。 +6. 汇总结果与后续建议,等待用户决定是否提交。 diff --git a/docs/issues/openai-compatible-video-prompt-duration-fallback/plan.md b/docs/issues/openai-compatible-video-prompt-duration-fallback/plan.md new file mode 100644 index 000000000..2f7ed4812 --- /dev/null +++ b/docs/issues/openai-compatible-video-prompt-duration-fallback/plan.md @@ -0,0 +1,21 @@ +# Plan + +## Approach +Add a small runtime helper that extracts an integer duration from obvious prompt hints only when structured video settings are absent and the parsed value is supported by the active model, then reuse that helper for both request tracing and the actual `/videos` request body. + +## Implementation +- Add a focused runtime test that exercises the OpenAI-compatible `/videos` flow and asserts `duration: 2` is sent for prompts like `... 2s`. +- Add a conservative prompt-duration extractor for `Ns`, `N sec`, `N seconds`, and `N秒`. +- Enforce model-specific validity before injecting the derived duration (for Seedance, `4~15`). +- Apply the fallback only when `videoGeneration.duration` and `videoGeneration.seconds` are both unset. 
+ +## Affected Files +- `src/main/presenter/llmProviderPresenter/aiSdk/runtime.ts` +- `test/main/presenter/llmProviderPresenter/aiSdkRuntime.test.ts` +- `docs/issues/openai-compatible-video-prompt-duration-fallback/tasks.md` + +## Validation +- Focused AI SDK runtime tests for video request bodies. +- `pnpm run format` +- `pnpm run i18n` +- `pnpm run lint` diff --git a/docs/issues/openai-compatible-video-prompt-duration-fallback/spec.md b/docs/issues/openai-compatible-video-prompt-duration-fallback/spec.md new file mode 100644 index 000000000..04f28d04b --- /dev/null +++ b/docs/issues/openai-compatible-video-prompt-duration-fallback/spec.md @@ -0,0 +1,25 @@ +# OpenAI-Compatible Video Prompt Duration Fallback + +## User Need +When users send prompts such as `生成 马斯克 喝酒的视频 2s` to OpenAI-compatible video models, DeepChat should preserve the obvious structured duration hint instead of sending only the raw prompt body. + +## Goal +Infer an explicit video duration from clear prompt suffixes like `5s` or `5秒` when the session has no structured video duration configured and the parsed value is valid for the target model. + +## Acceptance Criteria +1. OpenAI-compatible video requests derive `duration` from obvious prompt hints when neither `duration` nor `seconds` is already configured and the parsed value is valid for the current model. +2. Explicit structured video settings still take precedence over any prompt-derived fallback. +3. The emitted request trace matches the actual `/videos` body for this fallback. +4. Focused validation passes for the touched runtime slice. + +## Constraints +- Keep the fallback narrow and conservative; do not attempt broad natural-language parameter parsing. +- Preserve existing request-shape compatibility and polling behavior. + +## Non-Goals +- Adding or changing video settings UI. +- Parsing arbitrary style, ratio, or resolution hints from prompts. +- Changing provider safety or moderation behavior. + +## Open Questions +- None. 
diff --git a/docs/issues/openai-compatible-video-prompt-duration-fallback/tasks.md b/docs/issues/openai-compatible-video-prompt-duration-fallback/tasks.md new file mode 100644 index 000000000..bed18d1c6 --- /dev/null +++ b/docs/issues/openai-compatible-video-prompt-duration-fallback/tasks.md @@ -0,0 +1,11 @@ +# Tasks + +## Runtime Fallback +- [x] Add a runtime regression test for prompt-derived video duration. +- [x] Apply a conservative prompt duration fallback before building `/videos` requests. + +## Validation +- [x] Run focused AI SDK runtime tests. +- [x] Run `pnpm run format`. +- [x] Run `pnpm run i18n`. +- [x] Run `pnpm run lint`. diff --git a/electron-builder.yml b/electron-builder.yml index 3ceb532f1..1f1a84ef1 100644 --- a/electron-builder.yml +++ b/electron-builder.yml @@ -40,6 +40,9 @@ extraResources: - from: ./resources/skills/ to: app.asar.unpacked/resources/skills filter: ['**/*'] + - from: ./build/bundled-plugins/ + to: app.asar.unpacked/plugins + filter: ['**/*.dcplugin'] electronLanguages: - zh-CN - zh-TW @@ -78,10 +81,6 @@ nsis: afterSign: scripts/notarize.js afterPack: scripts/afterPack.js mac: - extraResources: - - from: ./build/bundled-plugins/ - to: app.asar.unpacked/plugins - filter: ['**/*.dcplugin'] entitlementsInherit: build/entitlements.mac.plist extendInfo: - NSCameraUsageDescription: Application requests access to the device's camera. 
diff --git a/package.json b/package.json index ff87a3f68..c6e7f5deb 100644 --- a/package.json +++ b/package.json @@ -1,6 +1,6 @@ { "name": "DeepChat", - "version": "1.0.4", + "version": "1.0.5-beta.1", "description": "DeepChat,一个简单易用的 Agent 客户端", "main": "./out/main/index.js", "author": "ThinkInAIXYZ", @@ -9,7 +9,7 @@ "node": ">=24.14.1 <25", "pnpm": ">=10.11.0" }, - "packageManager": "pnpm@10.13.1+sha512.37ebf1a5c7a30d5fabe0c5df44ee8da4c965ca0c5af3dbab28c3a1681b70a256218d05c81c9c0dcf767ef6b8551eb5b960042b9ed4300c59242336377e01cfad", + "packageManager": "pnpm@10.33.4+sha512.1c67b3b359b2d408119ba1ed289f34b8fc3c6873412bec6fd264fbdc82489e510fcbecb9ce9d22dae7f3b76269d8441046014bdca53b9979cd7a561ad631b800", "scripts": { "prebuild": "node scripts/fetch-provider-db.mjs && node scripts/fetch-acp-registry.mjs", "preinstall": "npx only-allow pnpm", @@ -38,30 +38,24 @@ "release:ff": "node scripts/release-fast-forward.mjs", "postinstall": "electron-builder install-app-deps && simple-git-hooks", "build:unpack": "pnpm run build && electron-builder --dir", - "build:win": "pnpm run build && electron-builder --win", - "build:win:x64": "pnpm run build && electron-builder --win --x64", - "build:win:arm64": "pnpm run build && electron-builder --win --arm64", - "plugin:cua:bundle:clean": "node -e \"require('fs').rmSync('build/bundled-plugins',{recursive:true,force:true})\"", - "plugin:cua:bundle": "pnpm run plugin:cua:bundle:clean && pnpm run plugin:cua:build && node scripts/package-plugin.mjs --release-version-from-root --target-platform darwin --out build/bundled-plugins plugins/cua", - "plugin:cua:bundle:mac:arm64": "pnpm run plugin:cua:bundle:clean && pnpm run plugin:cua:build:mac:arm64 && node scripts/package-plugin.mjs --release-version-from-root --target-platform darwin --target-arch arm64 --out build/bundled-plugins plugins/cua", - "plugin:cua:bundle:mac:x64": "pnpm run plugin:cua:bundle:clean && pnpm run plugin:cua:build:mac:x64 && node scripts/package-plugin.mjs 
--release-version-from-root --target-platform darwin --target-arch x64 --out build/bundled-plugins plugins/cua", + "plugin:validate": "node scripts/plugin.mjs validate", + "plugin:package": "node scripts/plugin.mjs package", + "plugin:bundle": "node scripts/plugin.mjs bundle", + "plugin:verify": "node scripts/plugin.mjs verify", + "plugin:bundle:clean": "node -e \"require('fs').rmSync('build/bundled-plugins',{recursive:true,force:true})\"", "plugin:cua:build": "node scripts/build-cua-plugin-runtime.mjs", "plugin:cua:build:mac:arm64": "node scripts/build-cua-plugin-runtime.mjs --arch arm64", "plugin:cua:build:mac:x64": "node scripts/build-cua-plugin-runtime.mjs --arch x64", - "plugin:cua:validate": "node scripts/package-plugin.mjs --validate --release-version-from-root --target-platform darwin plugins/cua", - "plugin:cua:validate:mac:arm64": "node scripts/package-plugin.mjs --validate --release-version-from-root --target-platform darwin --target-arch arm64 plugins/cua", - "plugin:cua:validate:mac:x64": "node scripts/package-plugin.mjs --validate --release-version-from-root --target-platform darwin --target-arch x64 plugins/cua", - "plugin:cua:package": "pnpm run plugin:cua:pack", - "plugin:cua:pack": "pnpm run plugin:cua:build && node scripts/package-plugin.mjs --release-version-from-root --target-platform darwin plugins/cua", - "plugin:cua:package:mac:arm64": "pnpm run plugin:cua:build:mac:arm64 && node scripts/package-plugin.mjs --release-version-from-root --target-platform darwin --target-arch arm64 plugins/cua", - "plugin:cua:package:mac:x64": "pnpm run plugin:cua:build:mac:x64 && node scripts/package-plugin.mjs --release-version-from-root --target-platform darwin --target-arch x64 plugins/cua", "install:sharp": "node scripts/install-sharp-for-platform.js", - "build:mac": "pnpm run build && pnpm run plugin:cua:bundle && electron-builder --mac", - "build:mac:arm64": "pnpm run build && pnpm run plugin:cua:bundle:mac:arm64 && electron-builder --mac --arm64", - 
"build:mac:x64": "pnpm run build && pnpm run plugin:cua:bundle:mac:x64 && electron-builder --mac --x64", - "build:linux": "pnpm run build && electron-builder --linux", - "build:linux:x64": "pnpm run build && electron-builder --linux --x64", - "build:linux:arm64": "pnpm run build && electron-builder --linux --arm64", + "build:mac": "pnpm run build && pnpm run plugin:bundle:clean && pnpm run plugin:cua:build && pnpm run plugin:bundle -- --name cua --platform darwin && pnpm run plugin:bundle -- --name feishu --platform darwin && electron-builder --mac", + "build:mac:arm64": "pnpm run build && pnpm run plugin:bundle:clean && pnpm run plugin:cua:build:mac:arm64 && pnpm run plugin:bundle -- --name cua --platform darwin --arch arm64 && pnpm run plugin:bundle -- --name feishu --platform darwin --arch arm64 && electron-builder --mac --arm64", + "build:mac:x64": "pnpm run build && pnpm run plugin:bundle:clean && pnpm run plugin:cua:build:mac:x64 && pnpm run plugin:bundle -- --name cua --platform darwin --arch x64 && pnpm run plugin:bundle -- --name feishu --platform darwin --arch x64 && electron-builder --mac --x64", + "build:win": "pnpm run build && pnpm run plugin:bundle:clean && pnpm run plugin:bundle -- --name feishu --platform win32 && electron-builder --win", + "build:win:x64": "pnpm run build && pnpm run plugin:bundle:clean && pnpm run plugin:bundle -- --name feishu --platform win32 --arch x64 && electron-builder --win --x64", + "build:win:arm64": "pnpm run build && pnpm run plugin:bundle:clean && pnpm run plugin:bundle -- --name feishu --platform win32 --arch arm64 && electron-builder --win --arm64", + "build:linux": "pnpm run build && pnpm run plugin:bundle:clean && pnpm run plugin:bundle -- --name feishu --platform linux && electron-builder --linux", + "build:linux:x64": "pnpm run build && pnpm run plugin:bundle:clean && pnpm run plugin:bundle -- --name feishu --platform linux --arch x64 && electron-builder --linux --x64", + "build:linux:arm64": "pnpm run build && 
pnpm run plugin:bundle:clean && pnpm run plugin:bundle -- --name feishu --platform linux --arch arm64 && electron-builder --linux --arm64", "afterSign": "scripts/notarize.js", "installRuntime": "npx -y tiny-runtime-injector --type uv --dir ./runtime/uv --runtime-version 0.9.18 && npx -y tiny-runtime-injector --type node --dir ./runtime/node && npx -y tiny-runtime-injector --type ripgrep --dir ./runtime/ripgrep && npx -y tiny-runtime-injector --type rtk --dir ./runtime/rtk", "installRuntime:win:x64": "npx -y tiny-runtime-injector --type uv --dir ./runtime/uv --runtime-version 0.9.18 -a x64 -p win32 && npx -y tiny-runtime-injector --type node --dir ./runtime/node -a x64 -p win32 && npx -y tiny-runtime-injector --type ripgrep --dir ./runtime/ripgrep -a x64 -p win32 && npx -y tiny-runtime-injector --type rtk --dir ./runtime/rtk -a x64 -p win32", @@ -79,139 +73,140 @@ }, "dependencies": { "@agentclientprotocol/sdk": "^0.16.1", - "@ai-sdk/amazon-bedrock": "^4.0.103", - "@ai-sdk/anthropic": "^3.0.76", - "@ai-sdk/azure": "^3.0.64", - "@ai-sdk/google": "^3.0.72", - "@ai-sdk/google-vertex": "^4.0.126", - "@ai-sdk/openai": "^3.0.63", + "@ai-sdk/amazon-bedrock": "^4.0.107", + "@ai-sdk/anthropic": "^3.0.78", + "@ai-sdk/azure": "^3.0.65", + "@ai-sdk/google": "^3.0.75", + "@ai-sdk/google-vertex": "^4.0.131", + "@ai-sdk/openai": "^3.0.64", "@ai-sdk/openai-compatible": "^2.0.47", "@ai-sdk/provider": "^3.0.10", - "@aws-sdk/client-bedrock": "^3.958.0", + "@aws-sdk/client-bedrock": "^3.1049.0", "@duckdb/node-api": "1.3.2-alpha.25", "@e2b/code-interpreter": "^1.5.1", "@electron-toolkit/preload": "^3.0.2", "@electron-toolkit/utils": "^4.0.0", "@jxa/run": "^1.4.0", - "@larksuiteoapi/node-sdk": "^1.60.0", - "@modelcontextprotocol/sdk": "^1.28.0", - "ai": "^6.0.177", - "axios": "^1.13.6", + "@larksuiteoapi/node-sdk": "^1.64.0", + "@modelcontextprotocol/sdk": "^1.29.0", + "ai": "^6.0.185", + "axios": "^1.16.1", "better-sqlite3-multiple-ciphers": "12.9.0", "cheerio": "^1.2.0", "chokidar": 
"^5.0.0", "compare-versions": "^6.1.1", "cross-spawn": "^7.0.6", "diff": "^8.0.4", - "electron-log": "^5.4.3", + "electron-log": "^5.4.4", "electron-store": "^8.2.0", "electron-updater": "^6.8.3", "electron-window-state": "^5.0.3", "es-mime-types": "^0.1.4", - "fflate": "^0.8.2", + "fflate": "^0.8.3", "font-list": "^2.0.2", "glob": "^13.0.6", "gray-matter": "^4.0.3", "https-proxy-agent": "^7.0.6", - "jsonrepair": "^3.13.3", + "jsonrepair": "^3.14.0", "mammoth": "^1.12.0", - "nanoid": "^5.1.7", + "nanoid": "^5.1.11", "node-pty": "^1.1.0", "ollama": "^0.6.3", "pdf-parse-new": "^1.4.1", "run-applescript": "^7.1.0", - "safe-regex2": "^5.1.0", + "safe-regex2": "^5.1.1", "sharp": "^0.33.5", "tokenx": "^0.4.1", - "turndown": "^7.2.2", - "undici": "^7.16.0", + "turndown": "^7.2.4", + "undici": "^7.25.0", "xlsx": "https://cdn.sheetjs.com/xlsx-0.20.3/xlsx-0.20.3.tgz", "xml2js": "^0.6.2", "zod": "^3.25.76" }, "devDependencies": { - "@antv/infographic": "^0.2.7", + "@antv/infographic": "^0.2.19", "@electron-toolkit/tsconfig": "^1.0.1", "@electron/notarize": "^3.1.1", - "@iconify-json/lucide": "^1.2.99", - "@iconify-json/vscode-icons": "^1.2.45", - "@iconify/vue": "^5.0.0", + "@iconify-json/lucide": "^1.2.108", + "@iconify-json/vscode-icons": "^1.2.49", + "@iconify/vue": "^5.0.1", "@lingual/i18n-check": "0.8.12", "@pinia/colada": "^0.20.0", - "@playwright/test": "^1.59.1", + "@playwright/test": "^1.60.0", "@tailwindcss/typography": "^0.5.19", - "@tailwindcss/vite": "^4.2.2", - "@tiptap/core": "^2.11.7", - "@tiptap/extension-code-block": "^2.11.9", - "@tiptap/extension-document": "^2.11.7", - "@tiptap/extension-hard-break": "^2.11.7", - "@tiptap/extension-history": "^2.12.0", - "@tiptap/extension-mention": "^2.11.7", - "@tiptap/extension-paragraph": "^2.11.7", - "@tiptap/extension-placeholder": "^2.11.7", - "@tiptap/extension-text": "^2.11.7", - "@tiptap/pm": "^2.11.7", - "@tiptap/suggestion": "^2.11.7", - "@tiptap/vue-3": "^2.11.7", + "@tailwindcss/vite": "^4.3.0", + 
"@tiptap/core": "^2.27.2", + "@tiptap/extension-code-block": "^2.27.2", + "@tiptap/extension-document": "^2.27.2", + "@tiptap/extension-hard-break": "^2.27.2", + "@tiptap/extension-history": "^2.27.2", + "@tiptap/extension-mention": "^2.27.2", + "@tiptap/extension-paragraph": "^2.27.2", + "@tiptap/extension-placeholder": "^2.27.2", + "@tiptap/extension-text": "^2.27.2", + "@tiptap/pm": "^2.27.2", + "@tiptap/suggestion": "^2.27.2", + "@tiptap/vue-3": "^2.27.2", "@types/better-sqlite3": "^7.6.13", "@types/mime-types": "^3.0.1", - "@types/node": "^24.12.2", + "@types/node": "^24.12.4", "@types/xlsx": "^0.0.35", - "@typescript/native-preview": "7.0.0-dev.20260115.1", + "@typescript/native-preview": "7.0.0-dev.20260518.1", "@unovis/ts": "1.6.4", "@unovis/vue": "1.6.4", "@vee-validate/zod": "^4.15.1", - "@vitejs/plugin-vue": "^6.0.5", + "@vitejs/plugin-vue": "^6.0.7", "@vitest/ui": "^3.2.4", - "@vue/test-utils": "^2.4.6", + "@vue/test-utils": "^2.4.10", "@vueuse/core": "^12.8.2", "@xterm/addon-fit": "^0.10.0", "@xterm/xterm": "^5.5.0", - "autoprefixer": "^10.4.23", + "autoprefixer": "^10.5.0", "class-variance-authority": "^0.7.1", "clsx": "^2.1.1", "cross-env": "^10.1.0", - "dayjs": "^1.11.19", - "electron": "^40.9.2", + "dayjs": "^1.11.20", + "electron": "^40.10.0", "electron-builder": "26.9.0", "electron-vite": "5.0.0", "jsdom": "^26.1.0", - "katex": "^0.16.27", + "katex": "^0.16.47", "lint-staged": "^16.4.0", "lucide-vue-next": "^0.544.0", - "markstream-vue": "0.0.14-beta.8", - "mermaid": "^11.13.0", - "minimatch": "^10.2.4", + "markstream-vue": "1.0.0-rc.0", + "mermaid": "^11.15.0", + "minimatch": "^10.2.5", "monaco-editor": "^0.55.1", "oxfmt": "^0.42.0", - "oxlint": "^1.57.0", + "oxlint": "^1.65.0", "picocolors": "^1.1.1", "pinia": "^3.0.4", - "reka-ui": "^2.9.2", + "reka-ui": "^2.9.7", "simple-git-hooks": "^2.13.1", "stream-monaco": "^0.0.40", - "tailwind-merge": "^3.5.0", + "tailwind-merge": "^3.6.0", "tailwind-scrollbar-hide": "^4.0.0", - "tailwindcss": "^4.2.2", 
+ "tailwindcss": "^4.3.0", "tailwindcss-animate": "^1.0.7", + "taze": "^19.12.0", "tippy.js": "^6.3.7", "tw-animate-css": "^1.4.0", "typescript": "^5.9.3", "vee-validate": "^4.15.1", - "vite": "^7.3.1", + "vite": "^7.3.3", "vite-plugin-monaco-editor-esm": "^2.0.2", - "vite-plugin-vue-devtools": "^8.1.1", + "vite-plugin-vue-devtools": "^8.1.2", "vite-svg-loader": "^5.1.1", "vitest": "^3.2.4", - "vue": "^3.5.31", - "vue-i18n": "^11.3.0", + "vue": "^3.5.34", + "vue-i18n": "^11.4.4", "vue-router": "4", "vue-sonner": "^2.0.9", - "vue-tsgo": "0.0.1-yggdrasill.11", - "vue-virtual-scroller": "^3.0.0", + "vue-tsgo": "0.2.2", + "vue-virtual-scroller": "^3.0.3", "vuedraggable": "^4.1.0", - "yaml": "^2.8.3", - "zod-to-json-schema": "^3.25.1" + "yaml": "^2.9.0", + "zod-to-json-schema": "^3.25.2" }, "simple-git-hooks": { "pre-commit": "node scripts/pre-commit.mjs", diff --git a/plugins/feishu/plugin.json b/plugins/feishu/plugin.json index 8da49a279..2d0081ed9 100644 --- a/plugins/feishu/plugin.json +++ b/plugins/feishu/plugin.json @@ -11,7 +11,7 @@ "capabilities": ["runtime.manage", "mcp.register", "skills.register", "settings.contribute"], "source": { "type": "deepchat-official", - "url": "${github.release.download}/deepchat-plugin-feishu-${app.version}-${arch}.dcplugin", + "url": "${github.release.download}/deepchat-plugin-feishu-${app.version}-${target.platform}-${arch}.dcplugin", "publisher": "DeepChat" }, "mcpServers": [ diff --git a/resources/acp-registry/registry.json b/resources/acp-registry/registry.json index 7a4b51aab..759b3e401 100644 --- a/resources/acp-registry/registry.json +++ b/resources/acp-registry/registry.json @@ -61,7 +61,7 @@ { "id": "auggie", "name": "Auggie CLI", - "version": "0.26.0", + "version": "0.27.2", "description": "Augment Code's powerful software agent, backed by industry-leading context engine", "repository": "https://github.com/augmentcode/auggie", "website": "https://www.augmentcode.com/", @@ -72,7 +72,7 @@ "icon": 
"https://cdn.agentclientprotocol.com/registry/v1/latest/auggie.svg", "distribution": { "npx": { - "package": "@augmentcode/auggie@0.26.0", + "package": "@augmentcode/auggie@0.27.2", "args": [ "--acp" ], @@ -103,7 +103,7 @@ { "id": "claude-acp", "name": "Claude Agent", - "version": "0.33.1", + "version": "0.36.1", "description": "ACP wrapper for Anthropic's Claude", "repository": "https://github.com/agentclientprotocol/claude-agent-acp", "authors": [ @@ -114,7 +114,7 @@ "license": "proprietary", "distribution": { "npx": { - "package": "@agentclientprotocol/claude-agent-acp@0.33.1" + "package": "@agentclientprotocol/claude-agent-acp@0.36.1" } }, "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/claude-acp.svg" @@ -122,7 +122,7 @@ { "id": "cline", "name": "Cline", - "version": "2.18.0", + "version": "3.0.7", "description": "Autonomous coding agent CLI - capable of creating/editing files, running commands, using the browser, and more", "repository": "https://github.com/cline/cline", "website": "https://cline.bot/cli", @@ -133,7 +133,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/cline.svg", "distribution": { "npx": { - "package": "cline@2.18.0", + "package": "cline@3.0.7", "args": [ "--acp" ] @@ -143,7 +143,7 @@ { "id": "codebuddy-code", "name": "Codebuddy Code", - "version": "2.96.0", + "version": "2.97.3", "description": "Tencent Cloud's official intelligent coding tool", "website": "https://www.codebuddy.cn/cli/", "authors": [ @@ -152,7 +152,7 @@ "license": "Proprietary", "distribution": { "npx": { - "package": "@tencent-ai/codebuddy-code@2.96.0", + "package": "@tencent-ai/codebuddy-code@2.97.3", "args": [ "--acp" ] @@ -271,7 +271,7 @@ { "id": "corust-agent", "name": "Corust Agent", - "version": "0.5.1", + "version": "0.6.0", "description": "Co-building with a seasoned Rust partner.", "repository": "https://github.com/Corust-ai/corust-agent-release", "website": "https://corust.ai/", @@ -282,19 +282,19 @@ "distribution": { 
"binary": { "darwin-aarch64": { - "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.5.1/agent-darwin-arm64.tar.gz", + "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.6.0/agent-darwin-arm64.tar.gz", "cmd": "./corust-agent-acp" }, "darwin-x86_64": { - "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.5.1/agent-darwin-x64.tar.gz", + "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.6.0/agent-darwin-x64.tar.gz", "cmd": "./corust-agent-acp" }, "linux-x86_64": { - "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.5.1/agent-linux-x64.tar.gz", + "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.6.0/agent-linux-x64.tar.gz", "cmd": "./corust-agent-acp" }, "windows-x86_64": { - "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.5.1/agent-windows-x64.zip", + "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.6.0/agent-windows-x64.zip", "cmd": "./corust-agent-acp.exe" } } @@ -453,7 +453,7 @@ { "id": "dirac", "name": "Dirac", - "version": "0.3.41", + "version": "0.3.44", "description": "Reduces API costs by more than 50%, produces better and faster work. Uses Hash anchored parallel edits, AST manipulation and a whole lot of neat optimizations. 
Fully Open Source.", "repository": "https://github.com/dirac-run/dirac", "website": "https://dirac.run", @@ -464,7 +464,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/dirac.svg", "distribution": { "npx": { - "package": "dirac-cli@0.3.41", + "package": "dirac-cli@0.3.44", "args": [ "--acp" ] @@ -474,7 +474,7 @@ { "id": "factory-droid", "name": "Factory Droid", - "version": "0.122.0", + "version": "0.129.0", "description": "Factory Droid - AI coding agent powered by Factory AI", "website": "https://factory.ai/product/cli", "authors": [ @@ -483,7 +483,7 @@ "license": "proprietary", "distribution": { "npx": { - "package": "droid@0.122.0", + "package": "droid@0.129.0", "args": [ "exec", "--output-format", @@ -500,7 +500,7 @@ { "id": "fast-agent", "name": "fast-agent", - "version": "0.7.2", + "version": "0.7.6", "description": "Code and build agents with comprehensive multi-provider support", "repository": "https://github.com/evalstate/fast-agent", "website": "https://fast-agent.ai", @@ -510,7 +510,7 @@ "license": "Apache 2.0", "distribution": { "uvx": { - "package": "fast-agent-acp==0.7.2", + "package": "fast-agent-acp==0.7.6", "args": [ "-x" ] @@ -521,7 +521,7 @@ { "id": "gemini", "name": "Gemini CLI", - "version": "0.41.2", + "version": "0.42.0", "description": "Google's official CLI for Gemini", "repository": "https://github.com/google-gemini/gemini-cli", "website": "https://geminicli.com", @@ -531,7 +531,7 @@ "license": "Apache-2.0", "distribution": { "npx": { - "package": "@google/gemini-cli@0.41.2", + "package": "@google/gemini-cli@0.42.0", "args": [ "--acp" ] @@ -542,7 +542,7 @@ { "id": "github-copilot-cli", "name": "GitHub Copilot", - "version": "1.0.45", + "version": "1.0.49", "description": "GitHub's AI pair programmer", "repository": "https://github.com/github/copilot-cli", "website": "https://github.com/features/copilot/cli/", @@ -552,7 +552,7 @@ "license": "proprietary", "distribution": { "npx": { - "package": "@github/copilot@1.0.45", 
+ "package": "@github/copilot@1.0.49", "args": [ "--acp" ] @@ -563,7 +563,7 @@ { "id": "glm-acp-agent", "name": "GLM Agent", - "version": "1.1.3", + "version": "1.1.4", "description": "ACP agent powered by Zhipu AI's GLM Coding Plan models (glm-5.1, glm-5-turbo, glm-4.7, glm-4.5-air). Supports streaming, tool calls, mid-session model switching, image input via Z.AI Coding Plan Vision MCP, and session load/fork/resume with on-disk persistence.", "repository": "https://github.com/stefandevo/glm-acp-agent", "authors": [ @@ -573,14 +573,14 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/glm-acp-agent.svg", "distribution": { "npx": { - "package": "glm-acp-agent@1.1.3" + "package": "glm-acp-agent@1.1.4" } } }, { "id": "goose", "name": "goose", - "version": "1.33.1", + "version": "1.34.1", "description": "A local, extensible, open source AI agent that automates engineering tasks", "repository": "https://github.com/block/goose", "website": "https://block.github.io/goose/", @@ -591,35 +591,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-aarch64-apple-darwin.tar.bz2", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-aarch64-apple-darwin.tar.bz2", "cmd": "./goose", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-x86_64-apple-darwin.tar.bz2", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-x86_64-apple-darwin.tar.bz2", "cmd": "./goose", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-aarch64-unknown-linux-gnu.tar.bz2", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-aarch64-unknown-linux-gnu.tar.bz2", "cmd": "./goose", "args": [ "acp" ] }, "linux-x86_64": { - "archive": 
"https://github.com/block/goose/releases/download/v1.33.1/goose-x86_64-unknown-linux-gnu.tar.bz2", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-x86_64-unknown-linux-gnu.tar.bz2", "cmd": "./goose", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-x86_64-pc-windows-msvc.zip", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-x86_64-pc-windows-msvc.zip", "cmd": "./goose-package\\goose.exe", "args": [ "acp" @@ -632,7 +632,7 @@ { "id": "junie", "name": "Junie", - "version": "1543.24.0", + "version": "1588.20.0", "description": "AI Coding Agent by JetBrains", "repository": "https://github.com/JetBrains/junie", "website": "https://junie.jetbrains.com", @@ -643,35 +643,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-macos-aarch64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-macos-aarch64.zip", "cmd": "./Applications/junie.app/Contents/MacOS/junie", "args": [ "--acp=true" ] }, "darwin-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-macos-amd64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-macos-amd64.zip", "cmd": "./Applications/junie.app/Contents/MacOS/junie", "args": [ "--acp=true" ] }, "linux-aarch64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-linux-aarch64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-linux-aarch64.zip", "cmd": "./junie-app/bin/junie", "args": [ "--acp=true" ] }, "linux-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-linux-amd64.zip", + "archive": 
"https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-linux-amd64.zip", "cmd": "./junie-app/bin/junie", "args": [ "--acp=true" ] }, "windows-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-windows-amd64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-windows-amd64.zip", "cmd": "./junie/junie.exe", "args": [ "--acp=true" @@ -684,7 +684,7 @@ { "id": "kilo", "name": "Kilo", - "version": "7.2.52", + "version": "7.3.0", "description": "The open source coding agent", "repository": "https://github.com/Kilo-Org/kilocode", "website": "https://kilo.ai/", @@ -696,35 +696,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-darwin-arm64.zip", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-darwin-arm64.zip", "cmd": "./kilo", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-darwin-x64.zip", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-darwin-x64.zip", "cmd": "./kilo", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-linux-arm64.tar.gz", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-linux-arm64.tar.gz", "cmd": "./kilo", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-linux-x64.tar.gz", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-linux-x64.tar.gz", "cmd": "./kilo", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-windows-x64.zip", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-windows-x64.zip", 
"cmd": "./kilo.exe", "args": [ "acp" @@ -732,7 +732,7 @@ } }, "npx": { - "package": "@kilocode/cli@7.2.52", + "package": "@kilocode/cli@7.3.0", "args": [ "acp" ] @@ -742,7 +742,7 @@ { "id": "kimi", "name": "Kimi CLI", - "version": "1.42.0", + "version": "1.44.0", "description": "Moonshot AI's coding assistant", "repository": "https://github.com/MoonshotAI/kimi-cli", "website": "https://moonshotai.github.io/kimi-cli/", @@ -753,28 +753,28 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.42.0/kimi-1.42.0-aarch64-apple-darwin.tar.gz", + "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.44.0/kimi-1.44.0-aarch64-apple-darwin.tar.gz", "cmd": "./kimi", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.42.0/kimi-1.42.0-aarch64-unknown-linux-gnu.tar.gz", + "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.44.0/kimi-1.44.0-aarch64-unknown-linux-gnu.tar.gz", "cmd": "./kimi", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.42.0/kimi-1.42.0-x86_64-unknown-linux-gnu.tar.gz", + "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.44.0/kimi-1.44.0-x86_64-unknown-linux-gnu.tar.gz", "cmd": "./kimi", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.42.0/kimi-1.42.0-x86_64-pc-windows-msvc.zip", + "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.44.0/kimi-1.44.0-x86_64-pc-windows-msvc.zip", "cmd": "./kimi.exe", "args": [ "acp" @@ -848,7 +848,7 @@ { "id": "nova", "name": "Nova", - "version": "1.1.8", + "version": "1.1.9", "description": "Nova by Compass AI - a fully-fledged software engineer at your command", "repository": "https://github.com/Compass-Agentic-Platform/nova", "website": "https://www.compassap.ai/portfolio/nova.html", @@ -859,7 
+859,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/nova.svg", "distribution": { "npx": { - "package": "@compass-ai/nova@1.1.8", + "package": "@compass-ai/nova@1.1.9", "args": [ "acp" ] @@ -869,7 +869,7 @@ { "id": "opencode", "name": "OpenCode", - "version": "1.14.48", + "version": "1.15.5", "description": "The open source coding agent", "repository": "https://github.com/anomalyco/opencode", "website": "https://opencode.ai", @@ -881,42 +881,42 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-darwin-arm64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-darwin-arm64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-darwin-x64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-darwin-x64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-linux-arm64.tar.gz", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-linux-arm64.tar.gz", "cmd": "./opencode", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-linux-x64.tar.gz", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-linux-x64.tar.gz", "cmd": "./opencode", "args": [ "acp" ] }, "windows-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-windows-arm64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-windows-arm64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "windows-x86_64": { - "archive": 
"https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-windows-x64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-windows-x64.zip", "cmd": "./opencode.exe", "args": [ "acp" @@ -928,7 +928,7 @@ { "id": "pi-acp", "name": "pi ACP", - "version": "0.0.26", + "version": "0.0.27", "description": "ACP adapter for pi coding agent", "repository": "https://github.com/svkozak/pi-acp", "authors": [ @@ -937,7 +937,7 @@ "license": "MIT", "distribution": { "npx": { - "package": "pi-acp@0.0.26" + "package": "pi-acp@0.0.27" } }, "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/pi-acp.svg" @@ -1003,7 +1003,7 @@ { "id": "qoder", "name": "Qoder CLI", - "version": "0.2.12", + "version": "0.2.14", "description": "AI coding assistant with agentic capabilities", "website": "https://qoder.com", "authors": [ @@ -1013,7 +1013,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/qoder.svg", "distribution": { "npx": { - "package": "@qoder-ai/qodercli@0.2.12", + "package": "@qoder-ai/qodercli@0.2.14", "args": [ "--acp" ] @@ -1023,7 +1023,7 @@ { "id": "qwen-code", "name": "Qwen Code", - "version": "0.15.10", + "version": "0.15.11", "description": "Alibaba's Qwen coding assistant", "repository": "https://github.com/QwenLM/qwen-code", "website": "https://qwenlm.github.io/qwen-code-docs/en/users/overview", @@ -1033,7 +1033,7 @@ "license": "Apache-2.0", "distribution": { "npx": { - "package": "@qwen-code/qwen-code@0.15.10", + "package": "@qwen-code/qwen-code@0.15.11", "args": [ "--acp", "--experimental-skills" @@ -1089,7 +1089,7 @@ { "id": "stakpak", "name": "Stakpak", - "version": "0.3.80", + "version": "0.3.81", "description": "Open-source DevOps agent in Rust with enterprise-grade security", "repository": "https://github.com/stakpak/agent", "website": "https://stakpak.dev", @@ -1101,35 +1101,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": 
"https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-darwin-aarch64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-darwin-aarch64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-darwin-x86_64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-darwin-x86_64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-linux-aarch64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-linux-aarch64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-linux-x86_64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-linux-x86_64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-windows-x86_64.zip", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-windows-x86_64.zip", "cmd": "./stakpak.exe", "args": [ "acp" diff --git a/resources/model-db/providers.json b/resources/model-db/providers.json index fb0dc972c..6cccbe57e 100644 --- a/resources/model-db/providers.json +++ b/resources/model-db/providers.json @@ -1,59 +1,52 @@ { "providers": { - "302ai": { - "id": "302ai", - "name": "302.AI", - "display_name": "302.AI", - "api": "https://api.302.ai/v1", - "doc": "https://doc.302.ai", + "helicone": { + "id": "helicone", + "name": "Helicone", + "display_name": "Helicone", + "api": "https://ai-gateway.helicone.ai/v1", + "doc": "https://helicone.ai/models", "models": [ { - "id": "qwen3-235b-a22b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "claude-opus-4-1-20250805", + 
"name": "Anthropic: Claude Opus 4.1 (20250805)", + "display_name": "Anthropic: Claude Opus 4.1 (20250805)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.29, - "output": 2.86 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-4.1", - "name": "grok-4.1", - "display_name": "grok-4.1", + "id": "claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "display_name": "Anthropic: Claude 3.7 Sonnet", "modalities": { "input": [ "text", @@ -70,59 +63,79 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 2, - "output": 10 + "input": 3, + "output": 15, + 
"cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "mistral-small", + "name": "Mistral Small", + "display_name": "Mistral Small", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 128000, "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-26", - "last_updated": "2025-10-26", + "knowledge": "2024-02", + "release_date": "2024-02-26", + "last_updated": "2024-02-26", "cost": { - "input": 0.33, - "output": 1.32 + "input": 75, + "output": 200 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "grok-4-1-fast-reasoning", - "display_name": "grok-4-1-fast-reasoning", + "id": "chatgpt-4o-latest", + "name": "OpenAI ChatGPT-4o", + "display_name": "OpenAI ChatGPT-4o", "modalities": { "input": [ "text", @@ -133,127 +146,95 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "knowledge": "2024-08", + "release_date": "2024-08-14", + "last_updated": "2024-08-14", "cost": { - "input": 0.2, - "output": 0.5 + "input": 5, + "output": 20, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "gemini-2.5-flash-nothink", - "name": "gemini-2.5-flash-nothink", - "display_name": "gemini-2.5-flash-nothink", + "id": "kimi-k2-0905", + "name": "Kimi K2 (09/05)", + 
"display_name": "Kimi K2 (09/05)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-24", - "last_updated": "2025-06-24", + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.5, + "output": 2, + "cache_read": 0.39999999999999997 }, "type": "chat" }, { - "id": "grok-4.20-multi-agent-beta-0309", - "name": "grok-4.20-multi-agent-beta-0309", - "display_name": "grok-4.20-multi-agent-beta-0309", + "id": "gemma2-9b-it", + "name": "Google Gemma 2", + "display_name": "Google Gemma 2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-06", + "release_date": "2024-06-25", + "last_updated": "2024-06-25", "cost": { - "input": 2, - "output": 6 + "input": 0.01, + "output": 0.03 }, "type": "chat" }, { - "id": "kimi-k2-0905-preview", - 
"name": "kimi-k2-0905-preview", - "display_name": "kimi-k2-0905-preview", + "id": "llama-3.1-8b-instant", + "name": "Meta Llama 3.1 8B Instant", + "display_name": "Meta Llama 3.1 8B Instant", "modalities": { "input": [ "text" @@ -263,8 +244,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32678 }, "temperature": true, "tool_call": true, @@ -273,158 +254,131 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.632, - "output": 2.53 + "input": 0.049999999999999996, + "output": 0.08 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "claude-haiku-4-5", - "display_name": "claude-haiku-4-5", + "id": "mistral-large-2411", + "name": "Mistral-Large", + "display_name": "Mistral-Large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-16", - "last_updated": "2025-10-16", + "knowledge": "2024-07", + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 1, - "output": 5 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "claude-opus-4-5-20251101", - "display_name": "claude-opus-4-5-20251101", + "id": "gpt-4o", + "name": "OpenAI GPT-4o", + "display_name": "OpenAI GPT-4o", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + 
"context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 5, - "output": 25 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "gemini-2.5-flash-lite-preview-09-2025", - "display_name": "gemini-2.5-flash-lite-preview-09-2025", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "knowledge": "2025-09", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "qwen3-235b-a22b-instruct-2507", - "display_name": "qwen3-235b-a22b-instruct-2507", + "id": "claude-3-haiku-20240307", + "name": "Anthropic: Claude 3 Haiku", + 
"display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -433,112 +387,100 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2024-03", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", "cost": { - "input": 0.29, - "output": 1.143 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "sonar-reasoning", + "name": "Perplexity Sonar Reasoning", + "display_name": "Perplexity Sonar Reasoning", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.72, - "output": 3.2 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "mistral-large-2512", - "display_name": "mistral-large-2512", + "id": "llama-prompt-guard-2-22m", + "name": "Meta Llama Prompt Guard 2 22M", + "display_name": "Meta Llama Prompt Guard 2 22M", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, 
"limit": { - "context": 128000, - "output": 262144 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 1.1, - "output": 3.3 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "o3-pro", + "name": "OpenAI o3 Pro", + "display_name": "OpenAI o3 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -547,34 +489,36 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.286, - "output": 1.142 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "claude-3-5-haiku-20241022", - "display_name": "claude-3-5-haiku-20241022", + "id": "claude-haiku-4-5-20251001", + "name": "Anthropic: Claude 4.5 Haiku (20251001)", + "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], 
"output": [ "text" @@ -589,21 +533,23 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.8, - "output": 4 + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "doubao-seed-1-8-251215", - "name": "doubao-seed-1-8-251215", - "display_name": "doubao-seed-1-8-251215", + "id": "gpt-4.1-mini-2025-04-14", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ "text", @@ -614,28 +560,30 @@ ] }, "limit": { - "context": 224000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.114, - "output": 0.286 + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 }, "type": "chat" }, { - "id": "chatgpt-4o-latest", - "name": "chatgpt-4o-latest", - "display_name": "chatgpt-4o-latest", + "id": "gemini-2.5-pro", + "name": "Google Gemini 2.5 Pro", + "display_name": "Google Gemini 2.5 Pro", "modalities": { "input": [ "text", @@ -646,40 +594,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-08", - "last_updated": "2024-08-08", - "cost": { - "input": 5, - "output": 15 - }, - "type": "chat" - }, - { - "id": "glm-5", - "name": "glm-5", - "display_name": 
"glm-5", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -690,31 +606,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.6, - "output": 2.6 + "input": 1.25, + "output": 10, + "cache_read": 0.3125, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "deepseek-chat", - "name": "Deepseek-Chat", - "display_name": "Deepseek-Chat", + "id": "gpt-5-chat-latest", + "name": "OpenAI GPT-5 Chat Latest", + "display_name": "OpenAI GPT-5 Chat Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -722,28 +650,29 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-11-29", - "last_updated": "2024-11-29", + "knowledge": "2024-09", + "release_date": "2024-09-30", + "last_updated": "2024-09-30", "cost": { - "input": 0.29, - "output": 0.43 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "deepseek-v3.2-thinking", - "name": "DeepSeek-V3.2-Thinking", - "display_name": "DeepSeek-V3.2-Thinking", + "id": "grok-3-mini", + "name": "xAI Grok 3 Mini", + "display_name": "xAI Grok 3 Mini", 
"modalities": { "input": [ "text" @@ -753,45 +682,45 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.29, - "output": 0.43 + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "claude-sonnet-4-6", - "display_name": "claude-sonnet-4-6", + "id": "gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1 Codex Mini", + "display_name": "OpenAI: GPT-5.1 Codex Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -801,43 +730,39 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-18", - "last_updated": "2026-03-13", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15 + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "gpt-5-thinking", - "name": "gpt-5-thinking", - "display_name": "gpt-5-thinking", + "id": "grok-4-1-fast-reasoning", + "name": "xAI Grok 4.1 Fast Reasoning", + "display_name": "xAI Grok 4.1 Fast Reasoning", "modalities": { "input": [ "text", @@ -848,8 +773,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -857,21 +782,27 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 1.25, - "output": 10 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "glm-4.7-flashx", - "display_name": "glm-4.7-flashx", + "id": "kimi-k2-0711", + "name": "Kimi K2 (07/11)", + "display_name": "Kimi K2 (07/11)", "modalities": { "input": [ "text" @@ -881,285 +812,203 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-20", - "last_updated": "2026-01-20", + "open_weights": false, + "knowledge": "2025-01", + 
"release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.0715, - "output": 0.429 + "input": 0.5700000000000001, + "output": 2.3 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "gemini-3-flash-preview", - "display_name": "gemini-3-flash-preview", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 163840, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.5, - "output": 3 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen-Plus", - "display_name": "Qwen-Plus", + "id": "grok-4-1-fast-non-reasoning", + "name": "xAI Grok 4.1 Fast Non-Reasoning", + "display_name": "xAI Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + 
"supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0.12, - "output": 1.2 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "grok-4.20-beta-0309-non-reasoning", - "name": "grok-4.20-beta-0309-non-reasoning", - "display_name": "grok-4.20-beta-0309-non-reasoning", + "id": "qwen2.5-coder-7b-fast", + "name": "Qwen2.5 Coder 7B fast", + "display_name": "Qwen2.5 Coder 7B fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-09", + "release_date": "2024-09-15", + "last_updated": "2024-09-15", "cost": { - "input": 2, - "output": 6 + "input": 0.03, + "output": 0.09 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "claude-opus-4-7", - "display_name": "claude-opus-4-7", + "id": "grok-4", + "name": "xAI Grok 4", + "display_name": "xAI Grok 4", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - 
"xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2024-07", + "release_date": "2024-07-09", + "last_updated": "2024-07-09", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "sonar", + "name": "Perplexity Sonar", + "display_name": "Perplexity Sonar", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 127000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { 
- "input": 0.25, - "output": 2 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "gemini-3-pro-preview", - "display_name": "gemini-3-pro-preview", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text", @@ -1170,47 +1019,29 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 16400 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2, - "output": 12 + "input": 20, + "output": 40 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "grok-code-fast-1", + "name": "xAI Grok Code Fast 1", + "display_name": "xAI Grok Code Fast 1", "modalities": { "input": [ "text" @@ -1220,8 +1051,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, @@ -1230,29 +1061,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": false, - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2024-08", + "release_date": "2024-08-25", + "last_updated": "2024-08-25", 
"cost": { - "input": 0.3, - "output": 1.2 + "input": 0.19999999999999998, + "output": 1.5, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "qwen3-max-2025-09-23", - "name": "qwen3-max-2025-09-23", - "display_name": "qwen3-max-2025-09-23", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -1262,8 +1089,8 @@ ] }, "limit": { - "context": 258048, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -1272,54 +1099,20 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", - "cost": { - "input": 0.86, - "output": 3.43 - }, - "type": "chat" - }, - { - "id": "claude-sonnet-4-5-20250929", - "name": "claude-sonnet-4-5-20250929", - "display_name": "claude-sonnet-4-5-20250929", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-12", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 3, - "output": 15 + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen-Flash", - "display_name": "Qwen-Flash", + "id": "gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", "modalities": { "input": [ "text" @@ -1329,53 +1122,10 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": 
"summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", - "cost": { - "input": 0.022, - "output": 0.22 - }, - "type": "chat" - }, - { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -1385,74 +1135,78 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { "input": 1.25, - "output": 10 + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "grok-4-1-fast-non-reasoning", - "display_name": "grok-4-1-fast-non-reasoning", + "id": "gpt-5.1-chat-latest", + "name": "OpenAI GPT-5.1 Chat", + "display_name": "OpenAI GPT-5.1 Chat", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": 
false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "claude-3-5-haiku-latest", - "name": "claude-3-5-haiku-latest", - "display_name": "claude-3-5-haiku-latest", + "id": "claude-4.5-haiku", + "name": "Anthropic: Claude 4.5 Haiku", + "display_name": "Anthropic: Claude 4.5 Haiku", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1467,21 +1221,23 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.8, - "output": 4 + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101-thinking", - "name": "claude-opus-4-5-20251101-thinking", - "display_name": "claude-opus-4-5-20251101-thinking", + "id": "gpt-4.1", + "name": "OpenAI GPT-4.1", + "display_name": "OpenAI GPT-4.1", "modalities": { "input": [ "text", @@ -1492,148 +1248,100 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2025-04", + "release_date": "2025-04-14", + 
"last_updated": "2025-04-14", "cost": { - "input": 5, - "output": 25 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "gpt-5.2", - "display_name": "gpt-5.2", + "id": "glm-4.6", + "name": "Zai GLM-4.6", + "display_name": "Zai GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.75, - "output": 14 + "input": 0.44999999999999996, + "output": 1.5 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "gpt-5.4-mini", - "display_name": "gpt-5.4-mini", + "id": "llama-3.3-70b-versatile", + "name": "Meta Llama 3.3 70B Versatile", + "display_name": "Meta Llama 3.3 70B Versatile", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32678 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - 
"medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.75, - "output": 4.5 + "input": 0.59, + "output": 0.7899999999999999 }, "type": "chat" }, { - "id": "gemini-3-pro-image-preview", - "name": "gemini-3-pro-image-preview", - "display_name": "gemini-3-pro-image-preview", + "id": "claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ "text", @@ -1644,47 +1352,32 @@ ] }, "limit": { - "context": 32768, - "output": 64000 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 2, - "output": 120 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "glm-5.1", - "name": "glm-5.1", - "display_name": "glm-5.1", + "id": "gpt-oss-20b", + "name": "OpenAI GPT-OSS 20b", + "display_name": "OpenAI GPT-OSS 20b", "modalities": { "input": [ "text" @@ -1694,7 +1387,7 @@ ] }, "limit": { - "context": 200000, + 
"context": 131072, "output": 131072 }, "temperature": true, @@ -1705,93 +1398,84 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": false, - "release_date": "2026-04-10", - "last_updated": "2026-04-10", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.86, - "output": 3.5 + "input": 0.049999999999999996, + "output": 0.19999999999999998 }, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen-Max-Latest", - "display_name": "Qwen-Max-Latest", + "id": "claude-4.5-sonnet", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.343, - "output": 1.372 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "gpt-5.4-nano", - "display_name": "gpt-5.4-nano", + "id": "gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, 
"extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], + "default_enabled": true, + "mode": "fixed", + "effort": "high", "verbosity": "medium", "verbosity_options": [ "low", @@ -1801,197 +1485,166 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 1.25 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "gemini-2.5-flash-image", - "display_name": "gemini-2.5-flash-image", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-10-08", - "last_updated": "2025-10-08", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.3, - "output": 30 + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "gpt-4.1-mini", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], 
"output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.286, - "output": 1.142 + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 }, "type": "chat" }, { - "id": "gpt-5.4-mini-2026-03-17", - "name": "gpt-5.4-mini-2026-03-17", - "display_name": "gpt-5.4-mini-2026-03-17", + "id": "qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2025-07", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.75, - "output": 4.5 + "input": 0.22, + "output": 0.95 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": 
"llama-3.1-8b-instruct-turbo", + "name": "Meta Llama 3.1 8B Instruct Turbo", + "display_name": "Meta Llama 3.1 8B Instruct Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.02, + "output": 0.03 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "gpt-5.2-chat-latest", - "display_name": "gpt-5.2-chat-latest", + "id": "claude-opus-4-1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ "text", @@ -2002,30 +1655,37 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14 + "input": 15, + "output": 75, + 
"cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "doubao-seed-1-6-vision-250815", - "name": "doubao-seed-1-6-vision-250815", - "display_name": "doubao-seed-1-6-vision-250815", + "id": "claude-4.5-opus", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ "text", @@ -2036,178 +1696,231 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-11", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.114, - "output": 1.143 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gemini-3.1-flash-image-preview", - "name": "gemini-3.1-flash-image-preview", - "display_name": "gemini-3.1-flash-image-preview", + "id": "sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "display_name": "Perplexity Sonar Deep Research", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 127000, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-02-27", - "last_updated": "2026-02-27", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.5, - "output": 60 + "input": 2, + "output": 8 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - 
"name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "gemini-2.5-flash-lite", + "name": "Google Gemini 2.5 Flash Lite", + "display_name": "Google Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": false, "open_weights": false, - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2025-07", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.6, - "output": 4.8 + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998, + "cache_write": 0.09999999999999999 }, "type": "chat" }, { - "id": "glm-4.5-x", - "name": "glm-4.5-x", - "display_name": "glm-4.5-x", + "id": "gemini-3-pro-preview", + "name": "Google Gemini 3 Pro Preview", + "display_name": "Google Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thought_signatures" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "knowledge": "2025-11", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.143, - "output": 2.29 + "input": 2, + "output": 12, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "gpt-5.1", + "name": "OpenAI GPT-5.1", + "display_name": "OpenAI GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "gpt-5.1", - "display_name": "gpt-5.1", + "id": "gpt-5-nano", + "name": "OpenAI GPT-5 Nano", + "display_name": "OpenAI GPT-5 Nano", "modalities": { "input": [ "text", @@ -2225,16 +1938,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": 
"effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -2248,54 +1961,56 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 10 + "input": 0.049999999999999996, + "output": 0.39999999999999997, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "kimi-k2-thinking-turbo", - "display_name": "kimi-k2-thinking-turbo", + "id": "gpt-4o-mini", + "name": "OpenAI GPT-4o-mini", + "display_name": "OpenAI GPT-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.265, - "output": 9.119 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "Deepseek-Reasoner", - "display_name": "Deepseek-Reasoner", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -2305,8 +2020,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -2327,58 +2042,62 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-04", + "release_date": 
"2025-04-28", + "last_updated": "2025-04-28", "cost": { "input": 0.29, - "output": 0.43 + "output": 0.59 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "grok-4-fast-reasoning", - "display_name": "grok-4-fast-reasoning", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 256000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.48, + "output": 2 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805-thinking", - "name": "claude-opus-4-1-20250805-thinking", - "display_name": "claude-opus-4-1-20250805-thinking", + "id": "llama-4-scout", + "name": "Meta Llama 4 Scout 17B 16E", + "display_name": "Meta Llama 4 Scout 17B 16E", "modalities": { "input": [ "text", @@ -2389,36 +2108,29 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-27", - "last_updated": "2025-05-27", + "knowledge": "2025-01", + 
"release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 15, - "output": 75 + "input": 0.08, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "glm-4.5-air", - "display_name": "glm-4.5-air", + "id": "llama-prompt-guard-2-86m", + "name": "Meta Llama Prompt Guard 2 86M", + "display_name": "Meta Llama Prompt Guard 2 86M", "modalities": { "input": [ "text" @@ -2428,30 +2140,29 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.1143, - "output": 0.286 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "gpt-5.4-pro", - "display_name": "gpt-5.4-pro", + "id": "claude-sonnet-4-5-20250929", + "name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", "modalities": { "input": [ "text", @@ -2462,59 +2173,36 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + 
"knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 30, - "output": 180, - "cache_read": 0, - "cache_write": 0, - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "glm-5-turbo", - "display_name": "glm-5-turbo", + "id": "claude-3.5-sonnet-v2", + "name": "Anthropic: Claude 3.5 Sonnet v2", + "display_name": "Anthropic: Claude 3.5 Sonnet v2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -2522,50 +2210,42 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.72, - "output": 3.2 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { "id": "qwen3-30b-a3b", - "name": "Qwen3-30B-A3B", - "display_name": "Qwen3-30B-A3B", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 41000, + "output": 41000 }, "temperature": true, "tool_call": true, @@ -2585,24 +2265,22 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2025-06", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", 
"cost": { - "input": 0.11, - "output": 1.08 + "input": 0.08, + "output": 0.29 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "claude-opus-4-5", - "display_name": "claude-opus-4-5", + "id": "o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -2610,69 +2288,77 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 5, - "output": 25 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "ernie-4.5-21b-a3b-thinking", + "name": "Baidu Ernie 4.5 21B A3B Thinking", + "display_name": "Baidu Ernie 4.5 21B A3B Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 128000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "attachment": false, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { - "input": 
0.29, - "output": 0.86 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "glm-4.6", - "display_name": "glm-4.6", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -2682,8 +2368,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -2697,33 +2383,32 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.286, - "output": 1.142 + "input": 0.03, + "output": 0.13 }, "type": "chat" }, { - "id": "claude-opus-4-6-thinking", - "name": "claude-opus-4-6-thinking", - "display_name": "claude-opus-4-6-thinking", + "id": "claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -2731,267 +2416,181 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-05", - "release_date": "2026-02-06", - "last_updated": "2026-03-13", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 5, - "output": 25 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "gemini-2.5-flash-preview-09-2025", - "display_name": "gemini-2.5-flash-preview-09-2025", + "id": "sonar-reasoning-pro", + "name": "Perplexity Sonar Reasoning Pro", + "display_name": "Perplexity Sonar Reasoning Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.3, - "output": 2.5 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "claude-sonnet-4-6-thinking", - "name": "claude-sonnet-4-6-thinking", - "display_name": "claude-sonnet-4-6-thinking", + "id": "deepseek-tng-r1t2-chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "display_name": "DeepSeek TNG R1T2 Chimera", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 130000, + 
"output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-18", - "last_updated": "2026-03-13", + "knowledge": "2025-07", + "release_date": "2025-07-02", + "last_updated": "2025-07-02", "cost": { - "input": 3, - "output": 15 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "gpt-4.1-nano", + "name": "OpenAI GPT-4.1 Nano", + "display_name": "OpenAI GPT-4.1 Nano", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, + "attachment": false, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.145, - "output": 0.43 + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "claude-opus-4-1-20250805", - "display_name": "claude-opus-4-1-20250805", + "id": 
"gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 15, - "output": 75 + "input": 0.049999999999999996, + "output": 0.09999999999999999 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "gpt-5.4", - "display_name": "gpt-5.4", + "id": "o4-mini", + "name": "OpenAI o4 Mini", + "display_name": "OpenAI o4 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -2999,74 +2598,91 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "cache_write": 0, - "context_over_200k": { - "input": 5, - 
"output": 22.5 - } + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "gpt-5.1-chat-latest", - "display_name": "gpt-5.1-chat-latest", + "id": "gpt-5.1-codex", + "name": "OpenAI: GPT-5.1 Codex", + "display_name": "OpenAI: GPT-5.1 Codex", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { "input": 1.25, - "output": 10 + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "claude-haiku-4-5-20251001", - "display_name": "claude-haiku-4-5-20251001", + "id": "gemini-2.5-flash", + "name": "Google Gemini 2.5 Flash", + "display_name": "Google Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -3074,86 +2690,124 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 
24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-16", - "last_updated": "2025-10-16", + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1, - "output": 5 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax-M1", - "display_name": "MiniMax-M1", + "id": "gpt-5-mini", + "name": "OpenAI GPT-5 Mini", + "display_name": "OpenAI GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.132, - "output": 1.254 + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "gpt-5.4-nano-2026-03-17", - "name": "gpt-5.4-nano-2026-03-17", - "display_name": "gpt-5.4-nano-2026-03-17", + "id": "o3-mini", + "name": "OpenAI o3 Mini", + "display_name": "OpenAI o3 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + 
"context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -3161,56 +2815,55 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2023-10", + "release_date": "2023-10-01", + "last_updated": "2023-10-01", "cost": { - "input": 0.2, - "output": 1.25 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "claude-sonnet-4-20250514", - "display_name": "claude-sonnet-4-20250514", + "id": "llama-4-maverick", + "name": "Meta Llama 4 Maverick 17B 128E", + "display_name": "Meta Llama 4 Maverick 17B 128E", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "qwen3-coder-480b-a35b-instruct", - "display_name": "qwen3-coder-480b-a35b-instruct", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B 
A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -3221,7 +2874,7 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -3230,112 +2883,85 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-07", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.86, - "output": 3.43 + "input": 0.09999999999999999, + "output": 0.3 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "claude-opus-4-6", - "display_name": "claude-opus-4-6", + "id": "llama-3.3-70b-instruct", + "name": "Meta Llama 3.3 70B Instruct", + "display_name": "Meta Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 16400 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-06", - "last_updated": "2026-03-13", + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 5, - "output": 25 + "input": 0.13, + "output": 0.39 }, "type": "chat" }, { - "id": "doubao-seed-code-preview-251028", - "name": "doubao-seed-code-preview-251028", - "display_name": "doubao-seed-code-preview-251028", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 262000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-11", - "last_updated": "2025-11-11", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.17, - "output": 1.14 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "gpt-4.1-nano", - "display_name": "gpt-4.1-nano", + "id": "claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ "text", @@ -3346,29 +2972,31 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.7999999999999999, + 
"output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "deepseek-v3.2", - "display_name": "deepseek-v3.2", + "id": "gpt-oss-120b", + "name": "OpenAI GPT-OSS 120b", + "display_name": "OpenAI GPT-OSS 120b", "modalities": { "input": [ "text" @@ -3378,13 +3006,14 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -3393,34 +3022,35 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.29, - "output": 0.43 + "input": 0.04, + "output": 0.16 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "gpt-5-pro", - "display_name": "gpt-5-pro", + "id": "qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking", + "display_name": "Qwen3 235B A22B Thinking", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 262144, + "output": 81920 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -3428,72 +3058,65 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-08", - "last_updated": "2025-10-08", + "knowledge": 
"2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 15, - "output": 120 + "input": 0.3, + "output": 2.9000000000000004 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "gpt-4o", - "display_name": "gpt-4o", + "id": "hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2024-05", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 2.5, - "output": 10 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "claude-sonnet-4-5", - "display_name": "claude-sonnet-4-5", + "id": "o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -3501,9 +3124,9 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -3511,39 +3134,48 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 3, - "output": 15 + "input": 2, + 
"output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "o1-mini", + "name": "OpenAI: o1-mini", + "display_name": "OpenAI: o1-mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 65536 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -3555,13 +3187,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -3569,139 +3194,102 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 10 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "grok-4.20-beta-0309-reasoning", - "name": "grok-4.20-beta-0309-reasoning", - "display_name": "grok-4.20-beta-0309-reasoning", + "id": "grok-3", + "name": "xAI Grok 3", + "display_name": "xAI Grok 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 2, - "output": 6 + "input": 3, + "output": 15, + 
"cache_read": 0.75 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "claude-opus-4-20250514", - "display_name": "claude-opus-4-20250514", + "id": "grok-4-fast-non-reasoning", + "name": "xAI Grok 4 Fast Non-Reasoning", + "display_name": "xAI Grok 4 Fast Non-Reasoning", "modalities": { "input": [ "text", "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 15, - "output": 75 - }, - "type": "chat" - }, - { - "id": "glm-for-coding", - "name": "glm-for-coding", - "display_name": "glm-for-coding", - "modalities": { - "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-09", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.086, - "output": 0.343 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929-thinking", - "name": "claude-sonnet-4-5-20250929-thinking", - "display_name": "claude-sonnet-4-5-20250929-thinking", + "id": "grok-4-fast-reasoning", + "name": "xAI: Grok 4 Fast Reasoning", + "display_name": "xAI: Grok 4 Fast Reasoning", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -3711,25 
+3299,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-09", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 3, - "output": 15 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "glm-4.5-airx", - "name": "glm-4.5-airx", - "display_name": "glm-4.5-airx", + "id": "sonar-pro", + "name": "Perplexity Sonar Pro", + "display_name": "Perplexity Sonar Pro", "modalities": { "input": [ "text" @@ -3739,76 +3327,75 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.572, - "output": 1.714 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "gpt-4.1", - "display_name": "gpt-4.1", + "id": "llama-3.1-8b-instruct", + "name": "Meta Llama 3.1 8B Instruct", + "display_name": "Meta Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 
2, - "output": 8 + "input": 0.02, + "output": 0.049999999999999996 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "gpt-5", + "name": "OpenAI GPT-5", + "display_name": "OpenAI GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -3817,29 +3404,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.575, - "output": 2.3 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "gemini-2.0-flash-lite", - "display_name": "gemini-2.0-flash-lite", + "id": "llama-guard-4", + "name": "Meta Llama Guard 4 12B", + "display_name": "Meta Llama Guard 4 12B", "modalities": { "input": [ "text", @@ -3850,171 +3448,118 @@ ] }, "limit": { - "context": 2000000, - "output": 8192 + "context": 131072, + "output": 1024 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "knowledge": "2025-01", + 
"release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.21, + "output": 0.21 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "gpt-4.1-mini", - "display_name": "gpt-4.1-mini", + "id": "deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.4, - "output": 1.6 - }, - "type": "chat" - }, - { - "id": "grok-4-fast-non-reasoning", - "name": "grok-4-fast-non-reasoning", - "display_name": "grok-4-fast-non-reasoning", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.27, + "output": 1, + "cache_read": 0.21600000000000003 }, "type": "chat" - }, + } + ] + }, + "auriko": { + "id": "auriko", + "name": "Auriko", + "display_name": "Auriko", + "api": "https://api.auriko.ai/v1", + "doc": "https://docs.auriko.ai", + "models": [ { - "id": "doubao-seed-1-6-thinking-250715", - "name": "doubao-seed-1-6-thinking-250715", - "display_name": "doubao-seed-1-6-thinking-250715", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", 
"modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", - "cost": { - "input": 0.121, - "output": 1.21 - }, - "type": "chat" - }, - { - "id": "ministral-14b-2512", - "name": "ministral-14b-2512", - "display_name": "ministral-14b-2512", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.33, - "output": 0.33 + "input": 0.5, + "output": 2.8 }, "type": "chat" - } - ] - }, - "alibaba": { - "id": "alibaba", - "name": "alibaba", - "display_name": "alibaba", - "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "models": [ + }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -4024,19 +3569,14 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { 
"supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -4050,34 +3590,34 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "qwen3.5-122b-a10b", - "name": "Qwen3.5 122B-A10B", - "display_name": "Qwen3.5 122B-A10B", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -4089,28 +3629,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.4, - "output": 3.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "deepseek-v4-pro", + "name": 
"DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -4121,42 +3687,52 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 5 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "qwen3.6-27b", - "name": "Qwen3.6 27B", - "display_name": "Qwen3.6 27B", + "id": "minimax-m2-7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -4164,211 +3740,210 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.3, + "output": 1.2, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen3.5-27b", - "name": "Qwen3.5 27B", - "display_name": "Qwen3.5 27B", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", 
"modalities": { "input": [ "text", "image", - "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", - "cost": { - "input": 0.3, - "output": 2.4 - }, - "type": "chat" - }, - { - "id": "qwen-vl-ocr", - "name": "Qwen Vl Ocr", - "display_name": "Qwen Vl Ocr", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 34096, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-28", - "last_updated": "2025-04-13", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.72, - "output": 0.72 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen-omni-turbo-realtime", - "name": "Qwen-Omni Turbo Realtime", - "display_name": "Qwen-Omni Turbo Realtime", + "id": "qwen-3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", "image", - "audio" + "video" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - 
"context": 32768, - "output": 2048 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.27, - "output": 1.07, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 0.5, + "output": 3, + "cache_read": 0.1, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "qwen3-8b", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.18, - "output": 0.7, - "reasoning": 2.1 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -4387,75 +3962,93 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + 
"level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.8, - "output": 2.4 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", @@ -4466,117 +4059,172 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.21, - "output": 0.63 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen3-livetranslate-flash-realtime", - "name": "Qwen3-LiveTranslate Flash Realtime", - 
"display_name": "Qwen3-LiveTranslate Flash Realtime", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", "audio", - "video" + "video", + "pdf" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 10, - "output": 10, - "input_audio": 10, - "output_audio": 38 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + 
"medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "minimax-m2-7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -4586,57 +4234,49 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.6, - "output": 6.4 + "input": 0.6, + "output": 2.4, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { 
"supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -4649,42 +4289,43 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.4, - "output": 1.2, - "reasoning": 4 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" - }, + } + ] + }, + "firepass": { + "id": "firepass", + "name": "Fireworks (Firepass)", + "display_name": "Fireworks (Firepass)", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://docs.fireworks.ai/firepass", + "models": [ { - "id": "qwen3.6-35b-a3b", - "name": "Qwen3.6 35B-A3B", - "display_name": "Qwen3.6 35B-A3B", + "id": "accounts/fireworks/routers/kimi-k2p6-turbo", + "name": "Kimi K2.6 Turbo", + "display_name": "Kimi K2.6 Turbo", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -4703,58 +4344,60 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, "release_date": "2026-04-17", "last_updated": "2026-04-17", "cost": { - "input": 0.248, - "output": 1.485 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" - }, + } + ] + }, + "nano-gpt": { + "id": "nano-gpt", + "name": "NanoGPT", + "display_name": "NanoGPT", + "api": "https://nano-gpt.com/api/v1", + "doc": "https://docs.nano-gpt.com", + "models": [ { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "glm-zero-preview", + 
"name": "GLM Zero Preview", + "display_name": "GLM Zero Preview", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 8000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.07, - "output": 0.27, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 1.802, + "output": 1.802 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -4764,100 +4407,71 @@ ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 0.05, - "output": 0.4 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "qwen2-5-vl-7b-instruct", - "name": "Qwen2.5-VL 7B Instruct", - "display_name": "Qwen2.5-VL 7B Instruct", 
+ "id": "hunyuan-t1-latest", + "name": "Hunyuan T1", + "display_name": "Hunyuan T1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2025-03-22", + "last_updated": "2025-03-22", "cost": { - "input": 0.35, - "output": 1.05 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "claude-opus-4-thinking:32000", + "name": "Claude 4 Opus Thinking (32K)", + "display_name": "Claude 4 Opus Thinking (32K)", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -4866,31 +4480,23 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.276, - "output": 1.651, - "cache_read": 0.028, - "cache_write": 0.344 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "Llama-3.3-70B-GeneticLemonade-Opus", + "name": "Llama 3.3 70B GeneticLemonade Opus", + "display_name": "Llama 3.3 70B GeneticLemonade Opus", "modalities": { 
"input": [ "text" @@ -4900,90 +4506,59 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.2, - "output": 6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-omni-flash", - "name": "Qwen3-Omni Flash", - "display_name": "Qwen3-Omni Flash", + "id": "claude-opus-4-1-20250805", + "name": "Claude 4.1 Opus", + "display_name": "Claude 4.1 Opus", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.43, - "output": 1.66, - "input_audio": 3.81, - "output_audio": 15.11 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "qwen2-5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "command-a-reasoning-08-2025", + "name": 
"Cohere Command A (08/2025)", + "display_name": "Cohere Command A (08/2025)", "modalities": { "input": [ "text" @@ -4993,107 +4568,87 @@ ] }, "limit": { - "context": 131072, + "context": 256000, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2025-08-22", + "last_updated": "2025-08-22", "cost": { - "input": 1.4, - "output": 5.6 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3-VL 235B-A22B", - "display_name": "Qwen3-VL 235B-A22B", + "id": "Llama-3.3-70B-Magnum-v4-SE", + "name": "Llama 3.3 70B Magnum v4 SE", + "display_name": "Llama 3.3 70B Magnum v4 SE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-asr-flash", - "name": "Qwen3-ASR Flash", - "display_name": "Qwen3-ASR Flash", + "id": "Llama-3.3-70B-The-Omega-Directive-Unslop-v2.1", + "name": "Llama 3.3 70B Omega Directive Unslop v2.1", + "display_name": "Llama 3.3 70B Omega Directive Unslop v2.1", "modalities": { "input": [ - 
"audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 32768, + "output": 16384 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.035, - "output": 0.035 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "Llama-3.3-70B-StrawberryLemonade-v1.0", + "name": "Llama 3.3 70B StrawberryLemonade v1.0", + "display_name": "Llama 3.3 70B StrawberryLemonade v1.0", "modalities": { "input": [ "text" @@ -5103,56 +4658,37 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.5, - "output": 6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen-mt-plus", - "name": "Qwen Mt Plus", - "display_name": "Qwen Mt Plus", + "id": "hidream", + "name": "Hidream", + "display_name": "Hidream", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 16384, + "context": 8192, "output": 8192 }, "temperature": true, @@ -5160,21 +4696,16 @@ 
"reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", - "cost": { - "input": 2.46, - "output": 7.37 - }, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "glm-4.1v-thinking-flashx", + "name": "GLM 4.1V Thinking FlashX", + "display_name": "GLM 4.1V Thinking FlashX", "modalities": { "input": [ "text", @@ -5185,61 +4716,79 @@ ] }, "limit": { - "context": 131072, + "context": 64000, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.8, - "output": 3.2 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "gemini-2.5-flash-preview-04-17:thinking", + "name": "Gemini 2.5 Flash Preview Thinking", + "display_name": "Gemini 2.5 Flash Preview Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048756, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": 
true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.15, + "output": 3.5 }, "type": "chat" }, { - "id": "qwen2-5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "auto-model-premium", + "name": "Auto model (Premium)", + "display_name": "Auto model (Premium)", "modalities": { "input": [ "text" @@ -5249,29 +4798,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 1000000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.175, - "output": 0.7 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "qwen2-5-14b-instruct", - "name": "Qwen2.5 14B Instruct", - "display_name": "Qwen2.5 14B Instruct", + "id": "jamba-large-1.6", + "name": "Jamba Large 1.6", + "display_name": "Jamba Large 1.6", "modalities": { "input": [ "text" @@ -5281,61 +4828,58 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.35, - "output": 1.4 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "qwen2-5-32b-instruct", - "name": "Qwen2.5 32B Instruct", - "display_name": "Qwen2.5 32B Instruct", + "id": "gemini-exp-1206", + "name": 
"Gemini 2.0 Pro 1206", + "display_name": "Gemini 2.0 Pro 1206", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 2097152, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.7, - "output": 2.8 + "input": 1.258, + "output": 4.998 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "Gemma-3-27B-CardProjector-v4", + "name": "Gemma 3 27B CardProjector v4", + "display_name": "Gemma 3 27B CardProjector v4", "modalities": { "input": [ "text" @@ -5345,196 +4889,203 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.5, - "output": 2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen-plus-character-ja", - "name": "Qwen Plus Character (Japanese)", - "display_name": "Qwen Plus Character (Japanese)", + "id": "gemini-3-pro-image-preview", + "name": "Gemini 3 Pro Image", + "display_name": "Gemini 3 Pro Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 512 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - 
"supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.5, - "output": 1.4 + "input": 2, + "output": 12 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen3-omni-flash-realtime", - "name": "Qwen3-Omni Flash Realtime", - "display_name": "Qwen3-Omni Flash Realtime", + "id": "claude-3-7-sonnet-thinking:8192", + "name": "Claude 3.7 Sonnet Thinking (8K)", + "display_name": "Claude 3.7 Sonnet Thinking (8K)", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 200000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.52, - "output": 1.99, - "input_audio": 4.57, - "output_audio": 18.13 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - 
"id": "qwen3-vl-30b-a3b", - "name": "Qwen3-VL 30B-A3B", - "display_name": "Qwen3-VL 30B-A3B", + "id": "doubao-seed-2-0-lite-260215", + "name": "Doubao Seed 2.0 Lite", + "display_name": "Doubao Seed 2.0 Lite", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.2, - "output": 0.8, - "reasoning": 2.4 + "input": 0.1462, + "output": 0.8738 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3 VL Plus", - "display_name": "Qwen3 VL Plus", + "id": "claude-sonnet-4-thinking:32768", + "name": "Claude 4 Sonnet Thinking (32K)", + "display_name": "Claude 4 Sonnet Thinking (32K)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 64000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": 
"2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 1.6, - "reasoning": 4.8 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "doubao-seed-2-0-pro-260215", + "name": "Doubao Seed 2.0 Pro", + "display_name": "Doubao Seed 2.0 Pro", "modalities": { "input": [ "text" @@ -5544,29 +5095,27 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.782, + "output": 3.876 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "Llama-3.3-70B-Progenitor-V3.3", + "name": "Llama 3.3 70B Progenitor V3.3", + "display_name": "Llama 3.3 70B Progenitor V3.3", "modalities": { "input": [ "text" @@ -5576,251 +5125,204 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.45, - "output": 2.25 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": 
"gemini-2.5-pro-exp-03-25", + "name": "Gemini 2.5 Pro Experimental 0325", + "display_name": "Gemini 2.5 Pro Experimental 0325", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-04-28", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.05, - "output": 0.2, - "reasoning": 0.5 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "qwen-mt-turbo", - "name": "Qwen Mt Turbo", - "display_name": "Qwen Mt Turbo", + "id": "ernie-4.5-turbo-vl-32k", + "name": "Ernie 4.5 Turbo VL 32k", + "display_name": "Ernie 4.5 Turbo VL 32k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 32000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.16, 
- "output": 0.49 + "input": 0.495, + "output": 1.43 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "deepseek-chat", + "name": "DeepSeek V3/Deepseek Chat", + "display_name": "DeepSeek V3/Deepseek Chat", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.13, - "cache_write": 1.625 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "qwen2-5-omni-7b", - "name": "Qwen2.5-Omni 7B", - "display_name": "Qwen2.5-Omni 7B", + "id": "step-3", + "name": "Step-3", + "display_name": "Step-3", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 65536, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.1, - "output": 0.4, - "input_audio": 6.76 + "input": 0.2499, + "output": 0.6494 }, "type": "chat" }, { - "id": 
"qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "Llama-3.3-70B-RAWMAW", + "name": "Llama 3.3 70B RAWMAW", + "display_name": "Llama 3.3 70B RAWMAW", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.4, - "output": 2.4, - "reasoning": 2.4 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "GLM-4.5-Air-Derestricted-Iceblink-v2-ReExtract", + "name": "GLM 4.5 Air Derestricted Iceblink v2 ReExtract", + "display_name": "GLM 4.5 Air Derestricted Iceblink v2 ReExtract", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -5828,62 +5330,56 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 2.8, - "output": 8.4 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qvq-max", - "name": "QVQ Max", - "display_name": "QVQ Max", + "id": 
"universal-summarizer", + "name": "Universal Summarizer", + "display_name": "Universal Summarizer", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2023-05-01", + "last_updated": "2024-01-01", "cost": { - "input": 1.2, - "output": 4.8 + "input": 30, + "output": 30 }, "type": "chat" }, { - "id": "qwen3-14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "GLM-4.5-Air-Derestricted-Steam-ReExtract", + "name": "GLM 4.5 Air Derestricted Steam ReExtract", + "display_name": "GLM 4.5 Air Derestricted Steam ReExtract", "modalities": { "input": [ "text" @@ -5894,92 +5390,26 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", - "cost": { - "input": 0.35, - "output": 1.4, - "reasoning": 4.2 - }, - "type": "chat" - }, - { - "id": "qwen3.5-35b-a3b", - "name": "Qwen3.5 35B-A3B", - "display_name": "Qwen3.5 35B-A3B", - "modalities": { - "input": [ - "text", - "image", - "video", - "audio" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "temperature": true, - 
"tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.25, - "output": 2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-09-23", - "name": "Qwen3 Coder Plus 2025 09 23", - "display_name": "Qwen3 Coder Plus 2025 09 23", + "id": "Llama-3.3-70B-Shakudo", + "name": "Llama 3.3 70B Shakudo", + "display_name": "Llama 3.3 70B Shakudo", "modalities": { "input": [ "text" @@ -5989,70 +5419,57 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" - }, - { - "id": "qwen3-coder-plus-2025-07-22", - "name": "Qwen3 Coder Plus 2025 07 22", - "display_name": "Qwen3 Coder Plus 2025 07 22", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-vl-ocr-latest", - "name": "Qwen Vl Ocr Latest", - "display_name": "Qwen Vl Ocr Latest", + "id": "Llama-3.3-70B-Predatorial-Extasy", + "name": "Llama 3.3 70B Predatorial Extasy", + "display_name": "Llama 3.3 70B Predatorial Extasy", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
34096, - "output": 4096 + "context": 32768, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qvq-max-2025-05-15", - "name": "Qvq Max 2025 05 15", - "display_name": "Qvq Max 2025 05 15", + "id": "gemini-2.5-pro-preview-03-25", + "name": "Gemini 2.5 Pro Preview 0325", + "display_name": "Gemini 2.5 Pro Preview 0325", "modalities": { "input": [ "text", @@ -6063,27 +5480,47 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 16384, - "min": 0, - "max": 16384 + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "cost": { + "input": 2.5, + "output": 10 + }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long", - "display_name": "Qwen Long", + "id": "Llama-3.3-70B-Cu-Mai-R1", + "name": "Llama 3.3 70B Cu Mai R1", + "display_name": "Llama 3.3 70B Cu Mai R1", "modalities": { "input": [ "text" @@ -6093,139 +5530,116 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 32768, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, 
"type": "chat" }, { - "id": "qwen-turbo-latest", - "name": "Qwen Turbo Latest", - "display_name": "Qwen Turbo Latest", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview (09/2025)", + "display_name": "Gemini 2.5 Flash Preview (09/2025)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-turbo-2024-09-19", - "name": "Qwen Turbo 2024 09 19", - "display_name": "Qwen Turbo 2024 09 19", + "id": "ernie-x1.1-preview", + "name": "ERNIE X1.1", + "display_name": "ERNIE X1.1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 64000, "output": 8192 }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "type": "chat" - }, - { - "id": "qwen-flash-2025-07-28", - "name": "Qwen Flash 2025 07 28", - "display_name": "Qwen Flash 2025 07 28", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 
1000000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", + "cost": { + "input": 0.15, + "output": 0.6 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -6235,19 +5649,13 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -6260,19 +5668,20 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 0.4, + "output": 1.7 + }, "type": "chat" }, { - "id": "qwen-plus-2024-09-19", - "name": "Qwen Plus 2024 09 19", - "display_name": "Qwen Plus 2024 09 19", + "id": "glm-z1-airx", + "name": "GLM Z1 AirX", + "display_name": "GLM Z1 AirX", "modalities": { "input": [ "text" @@ -6282,68 +5691,59 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32000, + "output": 16384 }, - 
"temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.7, + "output": 0.7 + }, "type": "chat" }, { - "id": "qwen-plus-2025-07-14", - "name": "Qwen Plus 2025 07 14", - "display_name": "Qwen Plus 2025 07 14", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-plus-2025-09-11", - "name": "Qwen Plus 2025 09 11", - "display_name": "Qwen Plus 2025 09 11", + "id": "v0-1.5-md", + "name": "v0 1.5 MD", + "display_name": "v0 1.5 MD", "modalities": { "input": [ "text" @@ -6353,77 +5753,63 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": 
"summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-07-04", + "last_updated": "2025-07-04", + "cost": { + "input": 3, + "output": 15 + }, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "claude-3-5-sonnet-20240620", + "name": "Claude 3.5 Sonnet Old", + "display_name": "Claude 3.5 Sonnet Old", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2024-06-20", + "last_updated": "2024-06-20", + "cost": { + "input": 2.992, + "output": 14.994 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-max-2024-09-19", - "name": "Qwen Max 2024 09 19", - "display_name": "Qwen Max 2024 09 19", + "id": "qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -6431,26 +5817,38 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + 
"open_weights": false, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "cost": { + "input": 0.5, + "output": 6 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-max-2024-04-28", - "name": "Qwen Max 2024 04 28", - "display_name": "Qwen Max 2024 04 28", + "id": "glm-4-plus", + "name": "GLM-4 Plus", + "display_name": "GLM-4 Plus", "modalities": { "input": [ "text" @@ -6460,21 +5858,27 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-08-01", + "last_updated": "2024-08-01", + "cost": { + "input": 7.497, + "output": 7.497 + }, "type": "chat" }, { - "id": "qwen-max-2024-04-03", - "name": "Qwen Max 2024 04 03", - "display_name": "Qwen Max 2024 04 03", + "id": "fastgpt", + "name": "Web Answer", + "display_name": "Web Answer", "modalities": { "input": [ "text" @@ -6484,21 +5888,27 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2023-08-01", + "last_updated": "2024-01-01", + "cost": { + "input": 7.5, + "output": 7.5 + }, "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen Max 2025 01 25", - "display_name": "Qwen Max 2025 01 25", + "id": "Llama-3.3-70B-Anthrobomination", + "name": "Llama 3.3 70B Anthrobomination", + "display_name": "Llama 3.3 70B Anthrobomination", "modalities": { "input": [ "text" @@ -6508,27 +5918,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - 
"search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qwen3-max-2025-09-23", - "name": "Qwen3 Max 20250923", - "display_name": "Qwen3 Max 20250923", + "id": "Llama-3.3-70B-Ignition-v0.1", + "name": "Llama 3.3 70B Ignition v0.1", + "display_name": "Llama 3.3 70B Ignition v0.1", "modalities": { "input": [ "text" @@ -6538,68 +5948,78 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048756, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + 
"release_date": "2025-06-05", + "last_updated": "2025-06-05", + "cost": { + "input": 2.5, + "output": 10 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "exa-research", + "name": "Exa (Research)", + "display_name": "Exa (Research)", "modalities": { "input": [ "text" @@ -6609,62 +6029,58 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-06-04", + "last_updated": "2025-06-04", + "cost": { + "input": 2.5, + "output": 2.5 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gemini-2.0-pro-exp-02-05", + "name": "Gemini 2.0 Pro 0205", + "display_name": "Gemini 2.0 Pro 0205", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 2097152, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "cost": { + "input": 1.989, + "output": 7.956 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "ernie-4.5-8k-preview", + "name": "Ernie 4.5 8k 
Preview", + "display_name": "Ernie 4.5 8k Preview", "modalities": { "input": [ "text" @@ -6674,21 +6090,27 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "cost": { + "input": 0.66, + "output": 2.6 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "auto-model-basic", + "name": "Auto model (Basic)", + "display_name": "Auto model (Basic)", "modalities": { "input": [ "text" @@ -6698,38 +6120,27 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 1000000 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "cost": { + "input": 9.996, + "output": 19.992 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "glm-4-long", + "name": "GLM-4 Long", + "display_name": "GLM-4 Long", "modalities": { "input": [ "text" @@ -6739,38 +6150,27 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-08-01", + "last_updated": "2024-08-01", + "cost": { + "input": 0.2006, + "output": 0.2006 + }, "type": "chat" }, { - "id": "qwen3-4b", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "qwq-32b", + "name": "Qwen: QwQ 32B", + "display_name": "Qwen: QwQ 32B", "modalities": { "input": [ "text" @@ -6780,19 +6180,12 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "supported": true }, "extra_capabilities": { "reasoning": { @@ -6806,53 +6199,50 @@ } }, "attachment": false, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.25599999, + "output": 0.30499999 + }, "type": "chat" }, { - "id": "qwen3-1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "doubao-1-5-thinking-pro-250415", + "name": "Doubao 1.5 Thinking Pro", + "display_name": "Doubao 1.5 Thinking Pro", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": false, + "release_date": "2025-04-17", + "last_updated": 
"2025-04-17", + "cost": { + "input": 0.6, + "output": 2.4 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "Llama-3.3-70B-GeneticLemonade-Unleashed-v3", + "name": "Llama 3.3 70B GeneticLemonade Unleashed v3", + "display_name": "Llama 3.3 70B GeneticLemonade Unleashed v3", "modalities": { "input": [ "text" @@ -6863,132 +6253,108 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qwen3-vl-plus-2025-09-23", - "name": "Qwen3 VL Plus 2025 09 23", - "display_name": "Qwen3 VL Plus 2025 09 23", + "id": "exa-research-pro", + "name": "Exa (Research Pro)", + "display_name": "Exa (Research Pro)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 16384, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-06-04", + "last_updated": "2025-06-04", + "cost": { + "input": 2.5, + "output": 2.5 + }, 
"type": "chat" }, { - "id": "qwq-plus-latest", - "name": "QwQ Plus Latest", - "display_name": "QwQ Plus Latest", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview", + "display_name": "Gemini 2.5 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": false + "attachment": true, + "open_weights": false, + "release_date": "2025-04-17", + "last_updated": "2025-04-17", + "cost": { + "input": 0.15, + "output": 0.6 }, - "attachment": false, "type": "chat" - } - ] - }, - "scaleway": { - "id": "scaleway", - "name": "Scaleway", - "display_name": "Scaleway", - "api": "https://api.scaleway.ai/v1", - "doc": "https://www.scaleway.com/en/docs/generative-apis/", - "models": [ + }, { - "id": "qwen3-embedding-8b", - "name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "doubao-seed-2-0-code-preview-260215", + "name": "Doubao Seed 2.0 Code Preview", + "display_name": "Doubao Seed 2.0 Code Preview", "modalities": { "input": [ "text" @@ -6998,28 +6364,27 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 256000, + "output": 128000 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-25-11", - "last_updated": "2026-03-17", + 
"release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.1, - "output": 0 + "input": 0.782, + "output": 3.893 }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "Llama-3.3-70B-Bigger-Body", + "name": "Llama 3.3 70B Bigger Body", + "display_name": "Llama 3.3 70B Bigger Body", "modalities": { "input": [ "text" @@ -7029,28 +6394,27 @@ ] }, "limit": { - "context": 260000, + "context": 32768, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.75, - "output": 2.25 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "Llama-3.3-70B-Fallen-v1", + "name": "Llama 3.3 70B Fallen v1", + "display_name": "Llama 3.3 70B Fallen v1", "modalities": { "input": [ "text" @@ -7060,75 +6424,27 @@ ] }, "limit": { - "context": 100000, + "context": 32768, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2026-03-17", - "cost": { - "input": 0.9, - "output": 0.9 - }, - "type": "chat" - }, - { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", - "modalities": { - "input": [ - "text", - "image", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { 
- "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "devstral-2-123b-instruct-2512", - "name": "Devstral 2 123B Instruct (2512)", - "display_name": "Devstral 2 123B Instruct (2512)", + "id": "Llama-3.3-70B-Electra-R1", + "name": "Llama 3.3 70B Electra R1", + "display_name": "Llama 3.3 70B Electra R1", "modalities": { "input": [ "text" @@ -7138,28 +6454,27 @@ ] }, "limit": { - "context": 256000, + "context": 32768, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-07", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.4, - "output": 2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "azure-o1", + "name": "Azure o1", + "display_name": "Azure o1", "modalities": { "input": [ "text" @@ -7169,39 +6484,30 @@ ] }, "limit": { - "context": 32000, - "output": 8196 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - 
"release_date": "2025-01-20", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2024-12-17", + "last_updated": "2024-12-17", "cost": { - "input": 0.9, - "output": 0.9 + "input": 14.994, + "output": 59.993 }, "type": "chat" }, { - "id": "pixtral-12b-2409", - "name": "Pixtral 12B 2409", - "display_name": "Pixtral 12B 2409", + "id": "deepseek-v3-0324", + "name": "DeepSeek Chat 0324", + "display_name": "DeepSeek Chat 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7209,125 +6515,122 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": false, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "chroma", + "name": "Chroma", + "display_name": "Chroma", "modalities": { "input": [ - "audio" + "text" ], "output": [ - "text" + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2026-03-17", - "cost": { - "input": 0.003, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "type": "chat" }, { - "id": "voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "claude-sonnet-4-5-20250929-thinking", + "name": "Claude Sonnet 4.5 Thinking", + "display_name": "Claude Sonnet 4.5 Thinking", "modalities": 
{ "input": [ "text", - "audio" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 1000000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.15, - "output": 0.35 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "gemma-3-27b-it", - "name": "Gemma-3-27B-IT", - "display_name": "Gemma-3-27B-IT", + "id": "jamba-large", + "name": "Jamba Large", + "display_name": "Jamba Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 8192 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2026-03-17", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.25, - "output": 0.5 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "bge-multilingual-gemma2", - "name": "BGE Multilingual Gemma2", - "display_name": "BGE Multilingual Gemma2", + "id": "Llama-3.3-70B-Nova", + "name": "Llama 3.3 70B Nova", + "display_name": "Llama 3.3 70B Nova", "modalities": { "input": [ "text" @@ -7337,92 +6640,84 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 32768, + "output": 16384 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - 
"release_date": "2024-07-26", - "last_updated": "2025-06-15", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1, - "output": 0 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "z-image-turbo", + "name": "Z Image Turbo", + "display_name": "Z Image Turbo", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2026-03-17", - "cost": { - "input": 0.2, - "output": 0.8 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-27", + "last_updated": "2025-11-27", "type": "chat" }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral Small 3.2 24B Instruct (2506)", - "display_name": "Mistral Small 3.2 24B Instruct (2506)", + "id": "jamba-mini-1.7", + "name": "Jamba Mini 1.7", + "display_name": "Jamba Mini 1.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-20", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.15, - "output": 0.35 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "Llama-3.3-70B-Strawberrylemonade-v1.2", + "name": "Llama 
3.3 70B StrawberryLemonade v1.2", + "display_name": "Llama 3.3 70B StrawberryLemonade v1.2", "modalities": { "input": [ "text" @@ -7432,33 +6727,27 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-01-01", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "doubao-seed-2-0-mini-260215", + "name": "Doubao Seed 2.0 Mini", + "display_name": "Doubao Seed 2.0 Mini", "modalities": { "input": [ "text" @@ -7468,28 +6757,27 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-07-25", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.0493, + "output": 0.4845 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "sonar", + "name": "Perplexity Simple", + "display_name": "Perplexity Simple", "modalities": { "input": [ "text" @@ -7499,38 +6787,27 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 127000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + 
"tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.003, + "output": 1.003 }, "type": "chat" - } - ] - }, - "nano-gpt": { - "id": "nano-gpt", - "name": "NanoGPT", - "display_name": "NanoGPT", - "api": "https://nano-gpt.com/api/v1", - "doc": "https://docs.nano-gpt.com", - "models": [ + }, { - "id": "glm-4-flash", - "name": "GLM-4 Flash", - "display_name": "GLM-4 Flash", + "id": "jamba-large-1.7", + "name": "Jamba Large 1.7", + "display_name": "Jamba Large 1.7", "modalities": { "input": [ "text" @@ -7540,7 +6817,7 @@ ] }, "limit": { - "context": 128000, + "context": 256000, "output": 4096 }, "tool_call": false, @@ -7549,18 +6826,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.1003, - "output": 0.1003 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "Meta-Llama-3-1-8B-Instruct-FP8", - "name": "Llama 3.1 8B (decentralized)", - "display_name": "Llama 3.1 8B (decentralized)", + "id": "glm-4-flash", + "name": "GLM-4 Flash", + "display_name": "GLM-4 Flash", "modalities": { "input": [ "text" @@ -7571,7 +6848,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "tool_call": false, "reasoning": { @@ -7579,18 +6856,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.02, - "output": 0.03 + "input": 0.1003, + "output": 0.1003 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:32000", - "name": "Claude 4 Opus Thinking (32K)", - "display_name": "Claude 4 
Opus Thinking (32K)", + "id": "claude-opus-4-1-thinking:8192", + "name": "Claude 4.1 Opus Thinking (8K)", + "display_name": "Claude 4.1 Opus Thinking (8K)", "modalities": { "input": [ "text", @@ -7627,60 +6904,39 @@ "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 0506", - "display_name": "Gemini 2.5 Pro Preview 0506", + "id": "step-2-16k-exp", + "name": "Step-2 16k Exp", + "display_name": "Step-2 16k Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 16000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "release_date": "2024-07-05", + "last_updated": "2024-07-05", "cost": { - "input": 2.5, - "output": 10 + "input": 7.004, + "output": 19.992 }, "type": "chat" }, { - "id": "grok-3-mini-fast-beta", - "name": "Grok 3 Mini Fast Beta", - "display_name": "Grok 3 Mini Fast Beta", + "id": "Llama-3.3-70B-Damascus-R1", + "name": "Damascus R1", + "display_name": "Damascus R1", "modalities": { "input": [ "text" @@ -7690,8 +6946,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7699,21 +6955,23 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.6, - "output": 4 + "input": 0.306, + 
"output": 0.306 }, "type": "chat" }, { - "id": "MiniMax-M2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "claude-opus-4-1-thinking:32000", + "name": "Claude 4.1 Opus Thinking (32K)", + "display_name": "Claude 4.1 Opus Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -7721,7 +6979,45 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 14.994, + "output": 75.004 + }, + "type": "chat" + }, + { + "id": "ernie-5.0-thinking-preview", + "name": "Ernie 5.0 Thinking Preview", + "display_name": "Ernie 5.0 Thinking Preview", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7733,20 +7029,20 @@ "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-25", - "last_updated": "2025-10-25", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.17, - "output": 1.53 + "input": 1.1, + "output": 2 }, "type": "chat" }, { - "id": "command-a-reasoning-08-2025", - "name": "Cohere Command A (08/2025)", - "display_name": "Cohere Command A (08/2025)", + "id": "Llama-3.3-70B-Mokume-Gane-R1", + "name": "Llama 3.3 70B Mokume Gane R1", + "display_name": "Llama 3.3 70B Mokume Gane R1", "modalities": { "input": [ "text" @@ -7756,8 +7052,8 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7765,18 +7061,18 @@ }, "attachment": false, "open_weights": false, - "release_date": 
"2025-08-22", - "last_updated": "2025-08-22", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2.5, - "output": 10 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "brave", - "name": "Brave (Answers)", - "display_name": "Brave (Answers)", + "id": "grok-3-beta", + "name": "Grok 3 Beta", + "display_name": "Grok 3 Beta", "modalities": { "input": [ "text" @@ -7786,8 +7082,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -7795,18 +7091,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 5, - "output": 5 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "exa-research", - "name": "Exa (Research)", - "display_name": "Exa (Research)", + "id": "GLM-4.5-Air-Derestricted-Iceblink", + "name": "GLM 4.5 Air Derestricted Iceblink", + "display_name": "GLM 4.5 Air Derestricted Iceblink", "modalities": { "input": [ "text" @@ -7816,8 +7112,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 98304 }, "tool_call": false, "reasoning": { @@ -7825,18 +7121,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2.5, - "output": 2.5 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Nova", - "name": "Llama 3.3 70B Nova", - "display_name": "Llama 3.3 70B Nova", + "id": "glm-4", + "name": "GLM-4", + "display_name": "GLM-4", "modalities": { "input": [ "text" @@ -7846,8 +7142,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -7855,30 +7151,31 @@ }, "attachment": false, "open_weights": false, - 
"release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-01-16", + "last_updated": "2024-01-16", "cost": { - "input": 0.306, - "output": 0.306 + "input": 14.994, + "output": 14.994 }, "type": "chat" }, { - "id": "gemini-exp-1206", - "name": "Gemini 2.0 Pro 1206", - "display_name": "Gemini 2.0 Pro 1206", + "id": "ernie-x1-turbo-32k", + "name": "Ernie X1 Turbo 32k", + "display_name": "Ernie X1 Turbo 32k", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2097152, - "output": 8192 + "context": 32000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7886,18 +7183,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 1.258, - "output": 4.998 + "input": 0.165, + "output": 0.66 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude 4.5 Opus", - "display_name": "Claude 4.5 Opus", + "id": "claude-opus-4-1-thinking:32768", + "name": "Claude 4.1 Opus Thinking (32K)", + "display_name": "Claude 4.1 Opus Thinking (32K)", "modalities": { "input": [ "text", @@ -7917,20 +7214,26 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 4.998, - "output": 25.007 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "auto-model-basic", - "name": "Auto model (Basic)", - "display_name": "Auto model (Basic)", + "id": "GLM-4.5-Air-Derestricted-Iceblink-v2", + "name": "GLM 4.5 Air Derestricted Iceblink v2", + "display_name": "GLM 4.5 Air Derestricted Iceblink v2", "modalities": { "input": [ "text" @@ -7940,8 +7243,8 @@ ] }, "limit": { - 
"context": 1000000, - "output": 1000000 + "context": 158600, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -7949,18 +7252,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "jamba-mini", - "name": "Jamba Mini", - "display_name": "Jamba Mini", + "id": "Llama-3.3-70B-Legion-V2.1", + "name": "Llama 3.3 70B Legion V2.1", + "display_name": "Llama 3.3 70B Legion V2.1", "modalities": { "input": [ "text" @@ -7970,8 +7273,8 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7979,70 +7282,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1989, - "output": 0.408 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview (09/2025)", - "display_name": "Gemini 2.5 Flash Lite Preview (09/2025)", + "id": "deepseek-math-v2", + "name": "DeepSeek Math V2", + "display_name": "DeepSeek Math V2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, + "context": 128000, "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + 
"attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "yi-large", - "name": "Yi Large", - "display_name": "Yi Large", + "id": "step-r1-v-mini", + "name": "Step R1 V Mini", + "display_name": "Step R1 V Mini", "modalities": { "input": [ "text" @@ -8052,8 +7333,8 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -8061,79 +7342,87 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-04-08", + "last_updated": "2025-04-08", "cost": { - "input": 3.196, - "output": 3.196 + "input": 2.5, + "output": 11 }, "type": "chat" }, { - "id": "auto-model-premium", - "name": "Auto model (Premium)", - "display_name": "Auto model (Premium)", + "id": "claude-opus-4-5-20251101:thinking", + "name": "Claude 4.5 Opus Thinking", + "display_name": "Claude 4.5 Opus Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 9.996, - "output": 19.992 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "azure-gpt-4o", - "name": "Azure gpt-4o", - "display_name": "Azure gpt-4o", + "id": "grok-3-mini-beta", + "name": "Grok 3 Mini 
Beta", + "display_name": "Grok 3 Mini Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0.3, + "output": 0.5 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek Chat 0324", - "display_name": "DeepSeek Chat 0324", + "id": "brave-research", + "name": "Brave (Research)", + "display_name": "Brave (Research)", "modalities": { "input": [ "text" @@ -8143,27 +7432,27 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", "cost": { - "input": 0.25, - "output": 0.7 + "input": 5, + "output": 5 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "claude-3-7-sonnet-thinking:1024", + "name": "Claude 3.7 Sonnet Thinking (1K)", + "display_name": "Claude 3.7 Sonnet Thinking (1K)", "modalities": { "input": [ "text", @@ -8176,26 +7465,47 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", 
+ "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.8, - "output": 4 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "doubao-seed-1-8-251215", - "name": "Doubao Seed 1.8", - "display_name": "Doubao Seed 1.8", + "id": "venice-uncensored", + "name": "Venice Uncensored", + "display_name": "Venice Uncensored", "modalities": { "input": [ "text" @@ -8206,7 +7516,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -8214,18 +7524,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.612, - "output": 6.12 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "doubao-seed-1-6-250615", - "name": "Doubao Seed 1.6", - "display_name": "Doubao Seed 1.6", + "id": "doubao-1.5-pro-256k", + "name": "Doubao 1.5 Pro 256k", + "display_name": "Doubao 1.5 Pro 256k", "modalities": { "input": [ "text" @@ -8244,44 +7554,60 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.204, - "output": 0.51 + "input": 0.799, + "output": 1.445 }, "type": "chat" }, { - "id": "ernie-x1.1-preview", - "name": "ERNIE X1.1", - "display_name": "ERNIE X1.1", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash 0520", + "display_name": "Gemini 2.5 Flash 0520", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 1048000, + "output": 65536 }, "tool_call": false, "reasoning": { - 
"supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { "input": 0.15, "output": 0.6 @@ -8289,13 +7615,12 @@ "type": "chat" }, { - "id": "ernie-5.0-thinking-preview", - "name": "Ernie 5.0 Thinking Preview", - "display_name": "Ernie 5.0 Thinking Preview", + "id": "KAT-Coder-Exp-72B-1010", + "name": "KAT Coder Exp 72B 1010", + "display_name": "KAT Coder Exp 72B 1010", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -8303,283 +7628,311 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 1.1, - "output": 2 + "input": 0.1, + "output": 0.2 }, "type": "chat" }, { - "id": "glm-4-air-0111", - "name": "GLM 4 Air 0111", - "display_name": "GLM 4 Air 0111", + "id": "claude-opus-4-thinking:32768", + "name": "Claude 4 Opus Thinking (32K)", + "display_name": "Claude 4 Opus Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-11", - "last_updated": "2025-01-11", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.1394, - "output": 0.1394 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "fastgpt", - "name": "Web Answer", - "display_name": "Web Answer", + "id": "claude-sonnet-4-thinking:1024", + "name": "Claude 4 Sonnet Thinking (1K)", + "display_name": "Claude 4 Sonnet Thinking (1K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2023-08-01", - "last_updated": "2024-01-01", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 7.5, - "output": 7.5 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "doubao-seed-1-6-thinking-250615", - "name": "Doubao Seed 1.6 Thinking", - "display_name": "Doubao Seed 1.6 Thinking", + "id": "qwen25-vl-72b-instruct", + "name": "Qwen25 VL 72b", + "display_name": "Qwen25 VL 72b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 32000, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2025-05-10", + 
"last_updated": "2025-05-10", "cost": { - "input": 0.204, - "output": 2.04 + "input": 0.69989, + "output": 0.69989 }, "type": "chat" }, { - "id": "gemini-2.0-flash-001", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "brave", + "name": "Brave (Answers)", + "display_name": "Brave (Answers)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", "cost": { - "input": 0.1003, - "output": 0.408 + "input": 5, + "output": 5 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking:32000", - "name": "Claude 4.1 Opus Thinking (32K)", - "display_name": "Claude 4.1 Opus Thinking (32K)", + "id": "azure-gpt-4-turbo", + "name": "Azure gpt-4-turbo", + "display_name": "Azure gpt-4-turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2023-11-06", + "last_updated": "2024-01-01", "cost": { - "input": 14.994, - "output": 75.004 + "input": 9.996, + "output": 30.005 }, "type": "chat" }, { - "id": "Llama-3.3-70B-RAWMAW", - "name": "Llama 3.3 70B RAWMAW", - "display_name": "Llama 3.3 70B RAWMAW", + "id": "ernie-5.0-thinking-latest", + "name": "Ernie 5.0 Thinking", + "display_name": "Ernie 5.0 
Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.1, + "output": 2 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Steam", - "name": "GLM 4.5 Air Derestricted Steam", - "display_name": "GLM 4.5 Air Derestricted Steam", + "id": "claude-3-7-sonnet-thinking:32768", + "name": "Claude 3.7 Sonnet Thinking (32K)", + "display_name": "Claude 3.7 Sonnet Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 220600, - "output": 65536 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude 3.5 Sonnet", - "display_name": "Claude 3.5 Sonnet", + "id": "doubao-seed-code-preview-latest", + "name": "Doubao Seed Code Preview", + 
"display_name": "Doubao Seed Code Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "yi-medium-200k", - "name": "Yi Medium 200k", - "display_name": "Yi Medium 200k", + "id": "Llama-3.3-70B-Cirrus-x1", + "name": "Llama 3.3 70B Cirrus x1", + "display_name": "Llama 3.3 70B Cirrus x1", "modalities": { "input": [ "text" @@ -8589,8 +7942,8 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -8598,48 +7951,49 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-03-01", - "last_updated": "2024-03-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2.499, - "output": 2.499 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Gemma-3-27B-ArliAI-RPMax-v3", - "name": "Gemma 3 27B RPMax v3", - "display_name": "Gemma 3 27B RPMax v3", + "id": "doubao-1-5-thinking-vision-pro-250428", + "name": "Doubao 1.5 Thinking Vision Pro", + "display_name": "Doubao 1.5 Thinking Vision Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2025-05-15", + "last_updated": 
"2025-05-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.55, + "output": 1.43 }, "type": "chat" }, { - "id": "phi-4-mini-instruct", - "name": "Phi 4 Mini", - "display_name": "Phi 4 Mini", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ "text" @@ -8649,27 +8003,38 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.04998, + "output": 0.2006 }, "type": "chat" }, { - "id": "ernie-x1-32k", - "name": "Ernie X1 32k", - "display_name": "Ernie X1 32k", + "id": "gemini-2.0-flash-thinking-exp-01-21", + "name": "Gemini 2.0 Flash Thinking 0121", + "display_name": "Gemini 2.0 Flash Thinking 0121", "modalities": { "input": [ "text", @@ -8680,27 +8045,33 @@ ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 1000000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "release_date": "2025-01-21", + "last_updated": "2025-01-21", "cost": { - "input": 0.33, - "output": 1.32 + "input": 0.306, + "output": 1.003 }, "type": "chat" }, { - "id": "deepseek-chat", - "name": "DeepSeek V3/Deepseek Chat", - "display_name": "DeepSeek V3/Deepseek Chat", + "id": "deepclaude", + "name": "DeepClaude", + "display_name": "DeepClaude", 
"modalities": { "input": [ "text", @@ -8714,69 +8085,69 @@ "context": 128000, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", "cost": { - "input": 0.25, - "output": 0.7 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "glm-z1-air", - "name": "GLM Z1 Air", - "display_name": "GLM Z1 Air", + "id": "deepseek-chat-cheaper", + "name": "DeepSeek V3/Chat Cheaper", + "display_name": "DeepSeek V3/Chat Cheaper", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 128000, + "output": 8192 }, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, "release_date": "2025-04-15", "last_updated": "2025-04-15", "cost": { - "input": 0.07, - "output": 0.07 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking:128000", - "name": "Claude 3.7 Sonnet Thinking (128K)", - "display_name": "Claude 3.7 Sonnet Thinking (128K)", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 0605", + "display_name": "Gemini 2.5 Pro Preview 0605", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048756, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -8787,34 +8158,33 @@ "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - 
"Anthropic uses thinking budget tokens" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 2.992, - "output": 14.994 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "glm-4-air", - "name": "GLM-4 Air", - "display_name": "GLM-4 Air", + "id": "qwen-max", + "name": "Qwen 2.5 Max", + "display_name": "Qwen 2.5 Max", "modalities": { "input": [ "text" @@ -8824,8 +8194,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -8833,18 +8203,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "release_date": "2024-04-03", + "last_updated": "2024-04-03", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 1.5997, + "output": 6.392 }, "type": "chat" }, { - "id": "Llama-3.3-70B-MiraiFanfare", - "name": "Llama 3.3 70b Mirai Fanfare", - "display_name": "Llama 3.3 70b Mirai Fanfare", + "id": "step-2-mini", + "name": "Step-2 Mini", + "display_name": "Step-2 Mini", "modalities": { "input": [ "text" @@ -8854,8 +8224,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -8863,85 +8233,100 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2024-07-05", + "last_updated": "2024-07-05", "cost": { - "input": 0.493, - "output": 0.493 + "input": 0.2006, + "output": 0.408 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp-01-21", - "name": "Gemini 2.0 Flash Thinking 0121", - "display_name": "Gemini 2.0 Flash Thinking 0121", + "id": "Llama-3.3-70B-Electranova-v1.0", + "name": "Llama 3.3 70B Electranova v1.0", + "display_name": "Llama 3.3 70B Electranova v1.0", "modalities": { "input": [ - 
"text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-21", - "last_updated": "2025-01-21", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { "input": 0.306, - "output": 1.003 + "output": 0.306 }, "type": "chat" }, { - "id": "Magistral-Small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "claude-3-7-sonnet-reasoner", + "name": "Claude 3.7 Sonnet Reasoner", + "display_name": "Claude 3.7 Sonnet Reasoner", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-03-29", + "last_updated": "2025-03-29", "cost": { - "input": 0.4, - "output": 1.4 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "doubao-1.5-pro-32k", - "name": "Doubao 1.5 Pro 32k", - "display_name": "Doubao 1.5 Pro 32k", + "id": "QwQ-32B-ArliAI-RpR-v1", + "name": "QwQ 32b Arli V1", + "display_name": "QwQ 32b Arli V1", "modalities": { "input": [ "text" @@ -8951,57 +8336,69 @@ ] 
}, "limit": { - "context": 32000, - "output": 8192 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-01-22", - "last_updated": "2025-01-22", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.1343, - "output": 0.3349 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "venice-uncensored:web", - "name": "Venice Uncensored Web", - "display_name": "Venice Uncensored Web", + "id": "ernie-4.5-turbo-128k", + "name": "Ernie 4.5 Turbo 128k", + "display_name": "Ernie 4.5 Turbo 128k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 80000, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-05-01", - "last_updated": "2024-05-01", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.132, + "output": 0.55 }, "type": "chat" }, { - "id": "glm-4", - "name": "GLM-4", - "display_name": "GLM-4", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -9011,27 +8408,38 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 64000, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - 
"release_date": "2024-01-16", - "last_updated": "2024-01-16", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 14.994, - "output": 14.994 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen 2.5 Max", - "display_name": "Qwen 2.5 Max", + "id": "glm-4-plus-0111", + "name": "GLM 4 Plus 0111", + "display_name": "GLM 4 Plus 0111", "modalities": { "input": [ "text" @@ -9041,8 +8449,8 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -9050,22 +8458,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2024-04-03", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 1.5997, - "output": 6.392 + "input": 9.996, + "output": 9.996 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct-original", - "name": "Qwen3 VL 235B A22B Instruct Original", - "display_name": "Qwen3 VL 235B A22B Instruct Original", + "id": "Llama-3.3-70B-Forgotten-Abomination-v5.0", + "name": "Llama 3.3 70B Forgotten Abomination v5.0", + "display_name": "Llama 3.3 70B Forgotten Abomination v5.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -9073,26 +8480,26 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.5, - "output": 1.2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "jamba-large-1.6", - "name": "Jamba Large 1.6", - "display_name": "Jamba Large 1.6", + "id": "doubao-seed-1-8-251215", + "name": "Doubao Seed 1.8", + "display_name": "Doubao Seed 1.8", "modalities": { "input": [ "text" @@ -9102,8 +8509,8 @@ ] }, 
"limit": { - "context": 256000, - "output": 4096 + "context": 128000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -9111,29 +8518,30 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "release_date": "2025-12-15", + "last_updated": "2025-12-15", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.612, + "output": 6.12 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 0506", + "display_name": "Gemini 2.5 Pro Preview 0506", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 995904, - "output": 32768 + "context": 1048756, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -9143,59 +8551,66 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", "cost": { - "input": 0.3995, - "output": 1.2002 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "qwen25-vl-72b-instruct", - "name": "Qwen25 VL 72b", - "display_name": "Qwen25 VL 72b", + "id": "auto-model-standard", + "name": "Auto model (Standard)", + "display_name": "Auto model (Standard)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32768 + "context": 1000000, + "output": 1000000 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, 
"open_weights": false, - "release_date": "2025-05-10", - "last_updated": "2025-05-10", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.69989, - "output": 0.69989 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking:64000", - "name": "Claude 4 Sonnet Thinking (64K)", - "display_name": "Claude 4 Sonnet Thinking (64K)", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview (09/2025)", + "display_name": "Gemini 2.5 Flash Lite Preview (09/2025)", "modalities": { "input": [ "text", @@ -9207,34 +8622,77 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048756, + "output": 65536 }, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "sonar-deep-research", + "name": "Perplexity Deep Research", + "display_name": "Perplexity Deep Research", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 60000, + "output": 128000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-02-25", + "last_updated": "2025-02-25", + "cost": { + "input": 3.4, + "output": 13.6 + }, + "type": 
"chat" + }, + { + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", @@ -9248,21 +8706,23 @@ "context": 1048756, "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ @@ -9272,18 +8732,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 2, - "output": 12 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Iceblink-ReExtract", - "name": "GLM 4.5 Air Derestricted Iceblink ReExtract", - "display_name": "GLM 4.5 Air Derestricted Iceblink ReExtract", + "id": "Gemma-3-27B-Glitter", + "name": "Gemma 3 27B Glitter", + "display_name": "Gemma 3 27B Glitter", "modalities": { "input": [ "text" @@ -9293,8 +8753,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -9302,8 +8762,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { "input": 0.306, "output": 0.306 @@ -9311,9 +8771,9 @@ "type": "chat" }, { - "id": "universal-summarizer", - "name": "Universal Summarizer", - "display_name": "Universal Summarizer", + "id": "Llama-3.3-70B-Vulpecula-R1", + "name": "Llama 3.3 70B Vulpecula R1", + "display_name": "Llama 3.3 70B Vulpecula R1", 
"modalities": { "input": [ "text" @@ -9324,7 +8784,7 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -9332,57 +8792,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-05-01", - "last_updated": "2024-01-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 30, - "output": 30 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking:32768", - "name": "Claude 4 Sonnet Thinking (32K)", - "display_name": "Claude 4 Sonnet Thinking (32K)", + "id": "Gemma-3-27B-it-Abliterated", + "name": "Gemma 3 27B IT Abliterated", + "display_name": "Gemma 3 27B IT Abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 32768, + "output": 96000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.42, + "output": 0.42 }, "type": "chat" }, { - "id": "sarvan-medium", - "name": "Sarvam Medium", - "display_name": "Sarvam Medium", + "id": "Llama-3.3-70B-Dark-Ages-v0.1", + "name": "Llama 3.3 70B Dark Ages v0.1", + "display_name": "Llama 3.3 70B Dark Ages v0.1", "modalities": { "input": [ "text" @@ -9392,7 +8843,7 @@ ] }, "limit": { - "context": 128000, + "context": 32768, "output": 16384 }, "tool_call": false, @@ -9401,31 +8852,30 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", 
"cost": { - "input": 0.25, - "output": 0.75 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking:8192", - "name": "Claude 3.7 Sonnet Thinking (8K)", - "display_name": "Claude 3.7 Sonnet Thinking (8K)", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048756, + "output": 65536 }, "tool_call": true, "reasoning": { @@ -9436,88 +8886,64 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" ], - "notes": [ - "Anthropic uses thinking budget tokens" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 2.992, - "output": 14.994 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash 0520", - "display_name": "Gemini 2.5 Flash 0520", + "id": "asi1-mini", + "name": "ASI1 Mini", + "display_name": "ASI1 Mini", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048000, - "output": 65536 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - 
"summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Iceblink-v2-ReExtract", - "name": "GLM 4.5 Air Derestricted Iceblink v2 ReExtract", - "display_name": "GLM 4.5 Air Derestricted Iceblink v2 ReExtract", + "id": "glm-4-air", + "name": "GLM-4 Air", + "display_name": "GLM-4 Air", "modalities": { "input": [ "text" @@ -9527,8 +8953,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -9536,229 +8962,170 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "release_date": "2024-06-05", + "last_updated": "2024-06-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Fallen-v1", - "name": "Llama 3.3 70B Fallen v1", - "display_name": "Llama 3.3 70B Fallen v1", + "id": "kimi-thinking-preview", + "name": "Kimi Thinking Preview", + "display_name": "Kimi Thinking Preview", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.306, - "output": 0.306 + "input": 31.46, + "output": 31.46 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B 
Thinking", + "id": "Meta-Llama-3-1-8B-Instruct-FP8", + "name": "Llama 3.1 8B (decentralized)", + "display_name": "Llama 3.1 8B (decentralized)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.5, - "output": 6 + "input": 0.02, + "output": 0.03 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking:32768", - "name": "Claude 3.7 Sonnet Thinking (32K)", - "display_name": "Claude 3.7 Sonnet Thinking (32K)", + "id": "Llama-3.3-70B-MiraiFanfare", + "name": "Llama 3.3 70b Mirai Fanfare", + "display_name": "Llama 3.3 70b Mirai Fanfare", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "release_date": "2025-07-26", + 
"last_updated": "2025-07-26", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.493, + "output": 0.493 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking:1024", - "name": "Claude 3.7 Sonnet Thinking (1K)", - "display_name": "Claude 3.7 Sonnet Thinking (1K)", + "id": "jamba-mini", + "name": "Jamba Mini", + "display_name": "Jamba Mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen3-vl-235b-a22b-instruct-original", + "name": "Qwen3 VL 235B A22B Instruct Original", + "display_name": "Qwen3 VL 235B A22B Instruct Original", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-09-25", + "last_updated": 
"2025-09-25", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.5, + "output": 1.2 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Vulpecula-R1", - "name": "Llama 3.3 70B Vulpecula R1", - "display_name": "Llama 3.3 70B Vulpecula R1", + "id": "GLM-4.5-Air-Derestricted-Steam", + "name": "GLM 4.5 Air Derestricted Steam", + "display_name": "GLM 4.5 Air Derestricted Steam", "modalities": { "input": [ "text" @@ -9768,8 +9135,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 220600, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -9777,8 +9144,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0.306, "output": 0.306 @@ -9786,9 +9153,9 @@ "type": "chat" }, { - "id": "claude-sonnet-4-thinking:8192", - "name": "Claude 4 Sonnet Thinking (8K)", - "display_name": "Claude 4 Sonnet Thinking (8K)", + "id": "claude-3-5-haiku-20241022", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text", @@ -9800,34 +9167,27 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 8192 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude 3.5 Sonnet", + "display_name": "Claude 3.5 Sonnet", "modalities": { "input": [ "text", @@ -9838,47 +9198,27 @@ ] }, "limit": { - "context": 
1048756, - "output": 65536 + "context": 200000, + "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 2.5, - "output": 10 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Ignition-v0.1", - "name": "Llama 3.3 70B Ignition v0.1", - "display_name": "Llama 3.3 70B Ignition v0.1", + "id": "KAT-Coder-Pro-V1", + "name": "KAT Coder Pro V1", + "display_name": "KAT Coder Pro V1", "modalities": { "input": [ "text" @@ -9888,8 +9228,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -9897,18 +9237,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.5, + "output": 6 }, "type": "chat" }, { - "id": "glm-4-plus-0111", - "name": "GLM 4 Plus 0111", - "display_name": "GLM 4 Plus 0111", + "id": "venice-uncensored:web", + "name": "Venice Uncensored Web", + "display_name": "Venice Uncensored Web", "modalities": { "input": [ "text" @@ -9918,8 +9258,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 80000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -9927,41 +9267,44 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": 
"2025-02-19", + "release_date": "2024-05-01", + "last_updated": "2024-05-01", "cost": { - "input": 9.996, - "output": 9.996 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "KAT-Coder-Air-V1", - "name": "KAT Coder Air V1", - "display_name": "KAT Coder Air V1", + "id": "claude-opus-4-5-20251101", + "name": "Claude 4.5 Opus", + "display_name": "Claude 4.5 Opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.1, - "output": 0.2 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, @@ -9996,55 +9339,13 @@ "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.4, - "output": 1.7 - }, - "type": "chat" - }, - { - "id": "doubao-1-5-thinking-pro-250415", - "name": "Doubao 1.5 Thinking Pro", - "display_name": "Doubao 1.5 Thinking Pro", + "id": "doubao-1-5-thinking-pro-vision-250415", + "name": "Doubao 1.5 Thinking Pro Vision", + "display_name": "Doubao 1.5 Thinking Pro Vision", "modalities": { "input": [ "text", - 
"pdf" + "image" ], "output": [ "text" @@ -10060,8 +9361,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { "input": 0.6, "output": 2.4 @@ -10069,9 +9370,9 @@ "type": "chat" }, { - "id": "sonar-pro", - "name": "Perplexity Pro", - "display_name": "Perplexity Pro", + "id": "sarvan-medium", + "name": "Sarvam Medium", + "display_name": "Sarvam Medium", "modalities": { "input": [ "text" @@ -10081,8 +9382,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -10090,51 +9391,53 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.25, + "output": 0.75 }, "type": "chat" }, { - "id": "Gemma-3-27B-it-Abliterated", - "name": "Gemma 3 27B IT Abliterated", - "display_name": "Gemma 3 27B IT Abliterated", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 96000 + "context": 1000000, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.42, - "output": 0.42 + "input": 0.0748, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek-chat-cheaper", - "name": "DeepSeek V3/Chat Cheaper", - "display_name": "DeepSeek V3/Chat Cheaper", + "id": "claude-opus-4-20250514", + "name": "Claude 4 Opus", + "display_name": "Claude 4 Opus", "modalities": { "input": [ "text", + 
"image", "pdf" ], "output": [ @@ -10142,8 +9445,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 32000 }, "tool_call": true, "reasoning": { @@ -10151,80 +9454,80 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 0.25, - "output": 0.7 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "gemini-2.0-pro-exp-02-05", - "name": "Gemini 2.0 Pro 0205", - "display_name": "Gemini 2.0 Pro 0205", + "id": "learnlm-1.5-pro-experimental", + "name": "Gemini LearnLM Experimental", + "display_name": "Gemini LearnLM Experimental", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2097152, + "context": 32767, "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", "cost": { - "input": 1.989, - "output": 7.956 + "input": 3.502, + "output": 10.506 }, "type": "chat" }, { - "id": "azure-gpt-4o-mini", - "name": "Azure gpt-4o-mini", - "display_name": "Azure gpt-4o-mini", + "id": "qwen-3.6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 991800, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.1496, - "output": 0.595 + "input": 0.45, + "output": 2.7 }, "type": "chat" }, { - "id": 
"Llama-3.3-70B-MS-Nevoria", - "name": "Llama 3.3 70B MS Nevoria", - "display_name": "Llama 3.3 70B MS Nevoria", + "id": "yi-large", + "name": "Yi Large", + "display_name": "Yi Large", "modalities": { "input": [ "text" @@ -10234,8 +9537,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 32000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -10243,57 +9546,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.306, - "output": 0.306 + "input": 3.196, + "output": 3.196 }, "type": "chat" }, { - "id": "claude-opus-4-thinking", - "name": "Claude 4 Opus Thinking", - "display_name": "Claude 4 Opus Thinking", + "id": "Baichuan-M2", + "name": "Baichuan M2 32B Medical", + "display_name": "Baichuan M2 32B Medical", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 14.994, - "output": 75.004 + "input": 15.73, + "output": 15.73 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Sapphira-0.1", - "name": "Llama 3.3 70B Sapphira 0.1", - "display_name": "Llama 3.3 70B Sapphira 0.1", + "id": "Llama-3.3-70B-ArliAI-RPMax-v2", + "name": "Llama 3.3 70B ArliAI RPMax v2", + "display_name": "Llama 3.3 70B ArliAI RPMax v2", "modalities": { "input": [ "text" @@ -10312,8 +9606,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - 
"last_updated": "2024-12-06", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { "input": 0.306, "output": 0.306 @@ -10321,9 +9615,9 @@ "type": "chat" }, { - "id": "doubao-seed-code-preview-latest", - "name": "Doubao Seed Code Preview", - "display_name": "Doubao Seed Code Preview", + "id": "glm-4-air-0111", + "name": "GLM 4 Air 0111", + "display_name": "GLM 4 Air 0111", "modalities": { "input": [ "text" @@ -10333,83 +9627,52 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-01-11", + "last_updated": "2025-01-11", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.1394, + "output": 0.1394 }, "type": "chat" }, { - "id": "qwen-3.6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", "image", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 991800, - "output": 65536 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", - "cost": { - "input": 0.45, - "output": 2.7 - }, - "type": "chat" - }, - { - "id": "Llama-3.3-70B-ArliAI-RPMax-v1.4", - "name": "Llama 3.3 70B RPMax v1.4", - "display_name": "Llama 3.3 70B RPMax v1.4", - "modalities": { - "input": [ - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - 
"last_updated": "2024-12-06", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, @@ -10445,40 +9708,39 @@ "type": "chat" }, { - "id": "glm-4.1v-thinking-flashx", - "name": "GLM 4.1V Thinking FlashX", - "display_name": "GLM 4.1V Thinking FlashX", + "id": "grok-3-mini-fast-beta", + "name": "Grok 3 Mini Fast Beta", + "display_name": "Grok 3 Mini Fast Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.6, + "output": 4 }, "type": "chat" }, { - "id": "hunyuan-t1-latest", - "name": "Hunyuan T1", - "display_name": "Hunyuan T1", + "id": "deepseek-reasoner-cheaper", + "name": "Deepseek R1 Cheaper", + "display_name": "Deepseek R1 Cheaper", "modalities": { "input": [ "text" @@ -10488,8 +9750,8 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -10497,52 +9759,52 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-22", - "last_updated": "2025-03-22", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.17, - "output": 0.66 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "doubao-1-5-thinking-vision-pro-250428", - "name": "Doubao 1.5 Thinking Vision Pro", - "display_name": "Doubao 1.5 Thinking Vision Pro", + "id": "Llama-3.3-70B-Aurora-Borealis", + "name": "Llama 3.3 70B Aurora Borealis", + "display_name": "Llama 3.3 70B Aurora Borealis", "modalities": { "input": [ - "text", - 
"image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 32768, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-15", - "last_updated": "2025-05-15", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.55, - "output": 1.43 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "asi1-mini", - "name": "ASI1 Mini", - "display_name": "ASI1 Mini", + "id": "claude-opus-4-thinking", + "name": "Claude 4 Opus Thinking", + "display_name": "Claude 4 Opus Thinking", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -10550,27 +9812,34 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 1, - "output": 1 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "ernie-5.0-thinking-latest", - "name": "Ernie 5.0 Thinking", - "display_name": "Ernie 5.0 Thinking", + "id": "gemini-2.0-flash-001", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", @@ -10581,28 +9850,27 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", 
"cost": { - "input": 1.1, - "output": 2 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Incandescent-Malevolence", - "name": "Llama 3.3 70B Incandescent Malevolence", - "display_name": "Llama 3.3 70B Incandescent Malevolence", + "id": "Gemma-3-27B-ArliAI-RPMax-v3", + "name": "Gemma 3 27B RPMax v3", + "display_name": "Gemma 3 27B RPMax v3", "modalities": { "input": [ "text" @@ -10621,8 +9889,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { "input": 0.306, "output": 0.306 @@ -10630,69 +9898,89 @@ "type": "chat" }, { - "id": "Llama-3.3-70B-Damascus-R1", - "name": "Damascus R1", - "display_name": "Damascus R1", + "id": "azure-gpt-4o", + "name": "Azure gpt-4o", + "display_name": "Azure gpt-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "Gemma-3-27B-Nidum-Uncensored", - "name": "Gemma 3 27B Nidum Uncensored", - "display_name": "Gemma 3 27B Nidum Uncensored", + "id": "gemini-3-pro-preview-thinking", + "name": "Gemini 3 Pro Thinking", + "display_name": "Gemini 3 Pro Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 96000 + "context": 1048756, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025-thinking", - "name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", - "display_name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", + "id": "claude-3-7-sonnet-thinking", + "name": "Claude 3.7 Sonnet Thinking", + "display_name": "Claude 3.7 Sonnet Thinking", "modalities": { "input": [ "text", @@ -10704,77 +9992,87 @@ ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 16000 }, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, + "min": 1024, "unit": "tokens" }, - "summaries": true, - "visibility": "summary", + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.1, - "output": 0.4 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "doubao-seed-2-0-pro-260215", - "name": "Doubao Seed 2.0 Pro", - "display_name": "Doubao Seed 2.0 Pro", + "id": 
"claude-opus-4-1-thinking:1024", + "name": "Claude 4.1 Opus Thinking (1K)", + "display_name": "Claude 4.1 Opus Thinking (1K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.782, - "output": 3.876 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "gemini-3-pro-image-preview", - "name": "Gemini 3 Pro Image", - "display_name": "Gemini 3 Pro Image", + "id": "gemini-2.5-flash-preview-05-20:thinking", + "name": "Gemini 2.5 Flash 0520 Thinking", + "display_name": "Gemini 2.5 Flash 0520 Thinking", "modalities": { "input": [ "text", @@ -10785,7 +10083,7 @@ ] }, "limit": { - "context": 1048756, + "context": 1048000, "output": 65536 }, "tool_call": false, @@ -10797,12 +10095,15 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ @@ -10812,78 +10113,88 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 2, - "output": 12 + "input": 0.15, + "output": 3.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "Gemma-3-27B-CardProjector-v4", - "name": "Gemma 3 27B 
CardProjector v4", - "display_name": "Gemma 3 27B CardProjector v4", + "id": "claude-opus-4-thinking:1024", + "name": "Claude 4 Opus Thinking (1K)", + "display_name": "Claude 4 Opus Thinking (1K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.306, - "output": 0.306 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "jamba-mini-1.7", - "name": "Jamba Mini 1.7", - "display_name": "Jamba Mini 1.7", + "id": "doubao-1.5-vision-pro-32k", + "name": "Doubao 1.5 Vision Pro 32k", + "display_name": "Doubao 1.5 Vision Pro 32k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 32000, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-01-22", + "last_updated": "2025-01-22", "cost": { - "input": 0.1989, - "output": 0.408 + "input": 0.459, + "output": 1.377 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Forgotten-Safeword-3.6", - "name": "Llama 3.3 70B Forgotten Safeword 3.6", - "display_name": "Llama 3.3 70B Forgotten Safeword 3.6", + "id": "Llama-3.3-70B-Fallen-R1-v1", + "name": "Llama 3.3 70B Fallen R1 v1", + "display_name": "Llama 3.3 70B Fallen R1 v1", "modalities": { "input": [ "text" @@ -10911,9 +10222,9 @@ "type": 
"chat" }, { - "id": "doubao-1-5-thinking-pro-vision-250415", - "name": "Doubao 1.5 Thinking Pro Vision", - "display_name": "Doubao 1.5 Thinking Pro Vision", + "id": "glm-4.1v-thinking-flash", + "name": "GLM 4.1V Thinking Flash", + "display_name": "GLM 4.1V Thinking Flash", "modalities": { "input": [ "text", @@ -10924,8 +10235,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 64000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -10933,69 +10244,48 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.6, - "output": 2.4 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 0605", - "display_name": "Gemini 2.5 Pro Preview 0605", + "id": "gemini-2.0-flash-thinking-exp-1219", + "name": "Gemini 2.0 Flash Thinking 1219", + "display_name": "Gemini 2.0 Flash Thinking 1219", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 32767, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": "2024-12-19", + "last_updated": "2024-12-19", "cost": { - "input": 2.5, - "output": 10 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "gemini-2.0-pro-reasoner", - "name": "Gemini 2.0 Pro Reasoner", - 
"display_name": "Gemini 2.0 Pro Reasoner", + "id": "Llama-3.3-70B-Magnum-v4-SE-Cirrus-x1-SLERP", + "name": "Llama 3.3 70B Magnum v4 SE Cirrus x1 SLERP", + "display_name": "Llama 3.3 70B Magnum v4 SE Cirrus x1 SLERP", "modalities": { "input": [ "text" @@ -11005,8 +10295,8 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -11014,46 +10304,42 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 1.292, - "output": 4.998 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "doubao-seed-2-0-lite-260215", - "name": "Doubao Seed 2.0 Lite", - "display_name": "Doubao Seed 2.0 Lite", + "id": "grok-3-fast-beta", + "name": "Grok 3 Fast Beta", + "display_name": "Grok 3 Fast Beta", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.1462, - "output": 0.8738 + "input": 5, + "output": 25 }, "type": "chat" }, @@ -11109,39 +10395,40 @@ "type": "chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Deep Research", - "display_name": "Perplexity Deep Research", + "id": "study_gpt-chatgpt-4o-latest", + "name": "Study Mode", + "display_name": "Study Mode", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 60000, - "output": 128000 + "context": 200000, + "output": 16384 }, "tool_call": false, 
"reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-02-25", - "last_updated": "2025-02-25", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 3.4, - "output": 13.6 + "input": 4.998, + "output": 14.994 }, "type": "chat" }, { - "id": "Gemma-3-27B-it", - "name": "Gemma 3 27B IT", - "display_name": "Gemma 3 27B IT", + "id": "Llama-3.3-70B-ArliAI-RPMax-v3", + "name": "Llama 3.3 70B ArliAI RPMax v3", + "display_name": "Llama 3.3 70B ArliAI RPMax v3", "modalities": { "input": [ "text" @@ -11160,8 +10447,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { "input": 0.306, "output": 0.306 @@ -11169,39 +10456,40 @@ "type": "chat" }, { - "id": "Llama-3.3-70B-GeneticLemonade-Unleashed-v3", - "name": "Llama 3.3 70B GeneticLemonade Unleashed v3", - "display_name": "Llama 3.3 70B GeneticLemonade Unleashed v3", + "id": "qwen-long", + "name": "Qwen Long 10M", + "display_name": "Qwen Long 10M", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 10000000, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "Gemma-3-27B-Glitter", - "name": "Gemma 3 27B Glitter", - "display_name": "Gemma 3 27B Glitter", + "id": "Baichuan4-Air", + "name": "Baichuan 4 Air", + "display_name": "Baichuan 4 Air", "modalities": { "input": [ "text" @@ -11212,7 +10500,7 @@ }, "limit": { "context": 32768, - "output": 16384 + "output": 32768 }, 
"tool_call": false, "reasoning": { @@ -11220,18 +10508,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.157, + "output": 0.157 }, "type": "chat" }, { - "id": "Llama-3.3-70B-The-Omega-Directive-Unslop-v2.1", - "name": "Llama 3.3 70B Omega Directive Unslop v2.1", - "display_name": "Llama 3.3 70B Omega Directive Unslop v2.1", + "id": "gemini-2.0-flash-exp-image-generation", + "name": "Gemini Text + Image", + "display_name": "Gemini Text + Image", "modalities": { "input": [ "text" @@ -11241,8 +10529,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 32767, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -11250,18 +10538,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "v0-1.5-lg", + "name": "v0 1.5 LG", + "display_name": "v0 1.5 LG", "modalities": { "input": [ "text" @@ -11271,8 +10559,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 1000000, + "output": 64000 }, "tool_call": false, "reasoning": { @@ -11280,85 +10568,63 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "release_date": "2025-07-04", + "last_updated": "2025-07-04", "cost": { - "input": 0.2, - "output": 0.5 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025-thinking", - "name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", - "display_name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", + 
"id": "yi-medium-200k", + "name": "Yi Medium 200k", + "display_name": "Yi Medium 200k", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2024-03-01", + "last_updated": "2024-03-01", "cost": { - "input": 0.3, - "output": 2.5 + "input": 2.499, + "output": 2.499 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "claude-opus-4-1-thinking", + "name": "Claude 4.1 Opus Thinking", + "display_name": "Claude 4.1 Opus Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -11366,37 +10632,23 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default_enabled": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": 
"2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.3, - "output": 2.5 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "deepclaude", - "name": "DeepClaude", - "display_name": "DeepClaude", + "id": "Mistral-Nemo-12B-Instruct-2407", + "name": "Mistral Nemo 12B Instruct 2407", + "display_name": "Mistral Nemo 12B Instruct 2407", "modalities": { "input": [ "text", @@ -11407,8 +10659,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -11416,18 +10668,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 3, - "output": 15 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "ernie-4.5-8k-preview", - "name": "Ernie 4.5 8k Preview", - "display_name": "Ernie 4.5 8k Preview", + "id": "yi-lightning", + "name": "Yi Lightning", + "display_name": "Yi Lightning", "modalities": { "input": [ "text" @@ -11437,8 +10689,8 @@ ] }, "limit": { - "context": 8000, - "output": 16384 + "context": 12000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -11446,18 +10698,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2024-10-16", + "last_updated": "2024-10-16", "cost": { - "input": 0.66, - "output": 2.6 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "doubao-seed-2-0-mini-260215", - "name": "Doubao Seed 2.0 Mini", - "display_name": "Doubao Seed 2.0 Mini", + "id": "sonar-reasoning-pro", + "name": "Perplexity Reasoning Pro", + "display_name": "Perplexity Reasoning Pro", "modalities": { "input": [ "text" @@ -11467,39 +10719,41 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 127000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + 
"default": true }, "attachment": false, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.0493, - "output": 0.4845 + "input": 2.006, + "output": 7.9985 }, "type": "chat" }, { - "id": "gemini-3-pro-preview-thinking", - "name": "Gemini 3 Pro Thinking", - "display_name": "Gemini 3 Pro Thinking", + "id": "claude-sonnet-4-thinking:8192", + "name": "Claude 4 Sonnet Thinking (8K)", + "display_name": "Claude 4 Sonnet Thinking (8K)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 1000000, + "output": 64000 }, "tool_call": true, "reasoning": { @@ -11509,34 +10763,23 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default_enabled": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 12 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "Llama-3.3-70B-GeneticLemonade-Opus", - "name": "Llama 3.3 70B GeneticLemonade Opus", - "display_name": "Llama 3.3 70B GeneticLemonade Opus", + "id": "azure-o3-mini", + "name": "Azure o3-mini", + "display_name": "Azure o3-mini", "modalities": { "input": [ "text" @@ -11546,8 +10789,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -11555,18 +10798,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - 
"input": 0.306, - "output": 0.306 + "input": 1.088, + "output": 4.3996 }, "type": "chat" }, { - "id": "v0-1.5-lg", - "name": "v0 1.5 LG", - "display_name": "v0 1.5 LG", + "id": "Llama-3.3-70B-Argunaut-1-SFT", + "name": "Llama 3.3 70B Argunaut 1 SFT", + "display_name": "Llama 3.3 70B Argunaut 1 SFT", "modalities": { "input": [ "text" @@ -11576,8 +10819,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -11585,49 +10828,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 15, - "output": 75 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "ernie-4.5-turbo-128k", - "name": "Ernie 4.5 Turbo 128k", - "display_name": "Ernie 4.5 Turbo 128k", + "id": "Llama-3.3-70B-Mhnnn-x1", + "name": "Llama 3.3 70B Mhnnn x1", + "display_name": "Llama 3.3 70B Mhnnn x1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 32768, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.132, - "output": 0.55 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "KAT-Coder-Pro-V1", - "name": "KAT Coder Pro V1", - "display_name": "KAT Coder Pro V1", + "id": "Llama-3.3-70B-ArliAI-RPMax-v1.4", + "name": "Llama 3.3 70B RPMax v1.4", + "display_name": "Llama 3.3 70B RPMax v1.4", "modalities": { "input": [ "text" @@ -11637,8 +10879,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -11646,89 +10888,48 @@ }, "attachment": false, 
"open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.5, - "output": 6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20240620", - "name": "Claude 3.5 Sonnet Old", - "display_name": "Claude 3.5 Sonnet Old", + "id": "Gemma-3-27B-it", + "name": "Gemma 3 27B IT", + "display_name": "Gemma 3 27B IT", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 200000, - "output": 8192 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2024-06-20", - "last_updated": "2024-06-20", - "cost": { - "input": 2.992, - "output": 14.994 - }, - "type": "chat" - }, - { - "id": "claude-opus-4-1-thinking:8192", - "name": "Claude 4.1 Opus Thinking (8K)", - "display_name": "Claude 4.1 Opus Thinking (8K)", - "modalities": { - "input": [ - "text", - "image", - "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "gemini-2.0-flash-exp-image-generation", - "name": "Gemini Text + Image", - "display_name": "Gemini Text + Image", + "id": "GLM-4.5-Air-Derestricted", + "name": "GLM 4.5 Air Derestricted", + "display_name": "GLM 4.5 Air Derestricted", "modalities": { "input": [ "text" @@ -11738,8 +10939,8 @@ ] }, 
"limit": { - "context": 32767, - "output": 8192 + "context": 202600, + "output": 98304 }, "tool_call": false, "reasoning": { @@ -11747,18 +10948,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Magnum-v4-SE", - "name": "Llama 3.3 70B Magnum v4 SE", - "display_name": "Llama 3.3 70B Magnum v4 SE", + "id": "Baichuan4-Turbo", + "name": "Baichuan 4 Turbo", + "display_name": "Baichuan 4 Turbo", "modalities": { "input": [ "text" @@ -11768,8 +10969,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -11777,18 +10978,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.42, + "output": 2.42 }, "type": "chat" }, { - "id": "glm-zero-preview", - "name": "GLM Zero Preview", - "display_name": "GLM Zero Preview", + "id": "jamba-mini-1.6", + "name": "Jamba Mini 1.6", + "display_name": "Jamba Mini 1.6", "modalities": { "input": [ "text" @@ -11798,7 +10999,7 @@ ] }, "limit": { - "context": 8000, + "context": 256000, "output": 4096 }, "tool_call": false, @@ -11807,18 +11008,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 1.802, - "output": 1.802 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "study_gpt-chatgpt-4o-latest", - "name": "Study Mode", - "display_name": "Study Mode", + "id": "qvq-max", + "name": "Qwen: QvQ Max", + "display_name": "Qwen: QvQ Max", "modalities": { "input": [ "text", @@ 
-11829,8 +11030,8 @@ ] }, "limit": { - "context": 200000, - "output": 16384 + "context": 128000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -11838,18 +11039,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-03-28", + "last_updated": "2025-03-28", "cost": { - "input": 4.998, - "output": 14.994 + "input": 1.4, + "output": 5.3 }, "type": "chat" }, { - "id": "glm-4-airx", - "name": "GLM-4 AirX", - "display_name": "GLM-4 AirX", + "id": "MiniMax-M1", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ "text" @@ -11859,8 +11060,8 @@ ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 1000000, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -11868,18 +11069,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 2.006, - "output": 2.006 + "input": 0.1394, + "output": 1.3328 }, "type": "chat" }, { - "id": "step-2-mini", - "name": "Step-2 Mini", - "display_name": "Step-2 Mini", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -11889,27 +11090,38 @@ ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 245800, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-07-05", - "last_updated": "2024-07-05", + "release_date": "2026-04-20", + "last_updated": "2026-04-21", "cost": { - "input": 0.2006, - "output": 0.408 + "input": 1.3, + "output": 7.8 }, "type": "chat" }, { - "id": 
"gemini-2.5-flash-preview-04-17:thinking", - "name": "Gemini 2.5 Flash Preview Thinking", - "display_name": "Gemini 2.5 Flash Preview Thinking", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", @@ -11950,48 +11162,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", - "cost": { - "input": 0.15, - "output": 3.5 - }, - "type": "chat" - }, - { - "id": "Llama-3.3-70B-Mokume-Gane-R1", - "name": "Llama 3.3 70B Mokume Gane R1", - "display_name": "Llama 3.3 70B Mokume Gane R1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 16384 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max 2026-01-23", + "display_name": "Qwen3 Max 2026-01-23", "modalities": { "input": [ "text" @@ -12001,8 +11183,8 @@ ] }, "limit": { - "context": 64000, - "output": 65536 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -12021,18 +11203,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - "input": 0.4, - "output": 1.7 + "input": 1.2002, + "output": 6.001 }, "type": "chat" }, { - "id": "glm-z1-airx", - "name": "GLM Z1 AirX", - "display_name": "GLM Z1 AirX", + "id": "Gemma-3-27B-Nidum-Uncensored", + "name": "Gemma 3 27B Nidum Uncensored", + "display_name": "Gemma 3 27B Nidum 
Uncensored", "modalities": { "input": [ "text" @@ -12042,27 +11224,27 @@ ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 32768, + "output": 96000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "jamba-mini-1.6", - "name": "Jamba Mini 1.6", - "display_name": "Jamba Mini 1.6", + "id": "GLM-4.6-Derestricted-v5", + "name": "GLM 4.6 Derestricted v5", + "display_name": "GLM 4.6 Derestricted v5", "modalities": { "input": [ "text" @@ -12072,8 +11254,8 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -12081,57 +11263,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.1989, - "output": 0.408 + "input": 0.4, + "output": 1.5 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking", - "name": "Claude 4.1 Opus Thinking", - "display_name": "Claude 4.1 Opus Thinking", + "id": "glm-4-airx", + "name": "GLM-4 AirX", + "display_name": "GLM-4 AirX", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 8000, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2024-06-05", + "last_updated": 
"2024-06-05", "cost": { - "input": 14.994, - "output": 75.004 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "grok-3-beta", - "name": "Grok 3 Beta", - "display_name": "Grok 3 Beta", + "id": "doubao-seed-1-6-flash-250615", + "name": "Doubao Seed 1.6 Flash", + "display_name": "Doubao Seed 1.6 Flash", "modalities": { "input": [ "text" @@ -12141,8 +11314,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -12150,18 +11323,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 3, - "output": 15 + "input": 0.0374, + "output": 0.374 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Legion-V2.1", - "name": "Llama 3.3 70B Legion V2.1", - "display_name": "Llama 3.3 70B Legion V2.1", + "id": "brave-pro", + "name": "Brave (Pro)", + "display_name": "Brave (Pro)", "modalities": { "input": [ "text" @@ -12171,8 +11344,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -12180,18 +11353,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 5, + "output": 5 }, "type": "chat" }, { - "id": "sonar", - "name": "Perplexity Simple", - "display_name": "Perplexity Simple", + "id": "Llama-3.3-70B-Sapphira-0.1", + "name": "Llama 3.3 70B Sapphira 0.1", + "display_name": "Llama 3.3 70B Sapphira 0.1", "modalities": { "input": [ "text" @@ -12201,8 +11374,8 @@ ] }, "limit": { - "context": 127000, - "output": 128000 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -12210,45 +11383,48 @@ }, "attachment": false, "open_weights": false, - "release_date": 
"2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.003, - "output": 1.003 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "z-image-turbo", - "name": "Z Image Turbo", - "display_name": "Z Image Turbo", + "id": "Llama-3.3-70B-Incandescent-Malevolence", + "name": "Llama 3.3 70B Incandescent Malevolence", + "display_name": "Llama 3.3 70B Incandescent Malevolence", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32768, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-27", - "last_updated": "2025-11-27", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Iceblink-v2", - "name": "GLM 4.5 Air Derestricted Iceblink v2", - "display_name": "GLM 4.5 Air Derestricted Iceblink v2", + "id": "gemini-2.0-pro-reasoner", + "name": "Gemini 2.0 Pro Reasoner", + "display_name": "Gemini 2.0 Pro Reasoner", "modalities": { "input": [ "text" @@ -12258,7 +11434,7 @@ ] }, "limit": { - "context": 158600, + "context": 128000, "output": 65536 }, "tool_call": false, @@ -12267,18 +11443,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.292, + "output": 4.998 }, "type": "chat" }, { - "id": "jamba-large", - "name": "Jamba Large", - "display_name": "Jamba Large", + "id": "hunyuan-turbos-20250226", + "name": "Hunyuan Turbo S", + "display_name": "Hunyuan Turbo S", "modalities": { "input": [ "text" @@ -12288,8 +11464,8 @@ ] }, "limit": { - "context": 256000, - "output": 
4096 + "context": 24000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -12297,162 +11473,139 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.187, + "output": 0.374 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-reasoner", - "name": "Claude 3.7 Sonnet Reasoner", - "display_name": "Claude 3.7 Sonnet Reasoner", + "id": "doubao-1.5-pro-32k", + "name": "Doubao 1.5 Pro 32k", + "display_name": "Doubao 1.5 Pro 32k", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 32000, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-29", - "last_updated": "2025-03-29", + "release_date": "2025-01-22", + "last_updated": "2025-01-22", "cost": { - "input": 3, - "output": 15 + "input": 0.1343, + "output": 0.3349 }, "type": "chat" }, { - "id": "ernie-4.5-turbo-vl-32k", - "name": "Ernie 4.5 Turbo VL 32k", - "display_name": "Ernie 4.5 Turbo VL 32k", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 128000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": 
false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.495, - "output": 1.43 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "Mistral-Nemo-12B-Instruct-2407", - "name": "Mistral Nemo 12B Instruct 2407", - "display_name": "Mistral Nemo 12B Instruct 2407", + "id": "Llama-3.3-70B-MS-Nevoria", + "name": "Llama 3.3 70B MS Nevoria", + "display_name": "Llama 3.3 70B MS Nevoria", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 32768, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "doubao-seed-1-6-flash-250615", - "name": "Doubao Seed 1.6 Flash", - "display_name": "Doubao Seed 1.6 Flash", + "id": "ernie-x1-32k", + "name": "Ernie X1 32k", + "display_name": "Ernie X1 32k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 32000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.0374, - "output": 0.374 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "qwq-32b", - "name": "Qwen: QwQ 32B", - "display_name": "Qwen: QwQ 32B", + "id": "auto-model", + "name": "Auto model", + "display_name": "Auto model", "modalities": { "input": [ "text" @@ -12462,82 +11615,73 
@@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 1000000 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.25599999, - "output": 0.30499999 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Strawberrylemonade-v1.2", - "name": "Llama 3.3 70B StrawberryLemonade v1.2", - "display_name": "Llama 3.3 70B StrawberryLemonade v1.2", + "id": "azure-gpt-4o-mini", + "name": "Azure gpt-4o-mini", + "display_name": "Azure gpt-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.1496, + "output": 0.595 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview", - "display_name": "Gemini 2.5 Flash Preview", + "id": "claude-3-7-sonnet-thinking:128000", + "name": "Claude 3.7 Sonnet Thinking (128K)", + "display_name": "Claude 3.7 Sonnet Thinking (128K)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ 
-12548,34 +11692,34 @@ "default_enabled": true, "mode": "budget", "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, + "min": 1024, "unit": "tokens" }, - "summaries": true, - "visibility": "summary", + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "ernie-x1-turbo-32k", - "name": "Ernie X1 Turbo 32k", - "display_name": "Ernie X1 Turbo 32k", + "id": "claude-opus-4-thinking:8192", + "name": "Claude 4 Opus Thinking (8K)", + "display_name": "Claude 4 Opus Thinking (8K)", "modalities": { "input": [ "text", @@ -12587,62 +11731,34 @@ ] }, "limit": { - "context": 32000, - "output": 16384 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", - "cost": { - "input": 0.165, - "output": 0.66 - }, - "type": "chat" - }, - { - "id": "deepseek-math-v2", - "name": "DeepSeek Math V2", - "display_name": "DeepSeek Math V2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "release_date": "2025-05-22", + "last_updated": 
"2025-05-22", "cost": { - "input": 0.6, - "output": 2.2 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Electranova-v1.0", - "name": "Llama 3.3 70B Electranova v1.0", - "display_name": "Llama 3.3 70B Electranova v1.0", + "id": "glm-z1-air", + "name": "GLM Z1 Air", + "display_name": "GLM Z1 Air", "modalities": { "input": [ "text" @@ -12652,85 +11768,80 @@ ] }, "limit": { - "context": 32768, + "context": 32000, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.07, + "output": 0.07 }, "type": "chat" }, { - "id": "Llama-3.3-70B-ArliAI-RPMax-v2", - "name": "Llama 3.3 70B ArliAI RPMax v2", - "display_name": "Llama 3.3 70B ArliAI RPMax v2", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 16000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.992, + "output": 14.994 
}, "type": "chat" }, { - "id": "qwen-image", - "name": "Qwen Image", - "display_name": "Qwen Image", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "type": "imageGeneration" - }, - { - "id": "Llama-3.3-70B-Cu-Mai-R1", - "name": "Llama 3.3 70B Cu Mai R1", - "display_name": "Llama 3.3 70B Cu Mai R1", + "id": "Gemma-3-27B-Big-Tiger-v3", + "name": "Gemma 3 27B Big Tiger v3", + "display_name": "Gemma 3 27B Big Tiger v3", "modalities": { "input": [ "text" @@ -12749,8 +11860,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { "input": 0.306, "output": 0.306 @@ -12758,12 +11869,13 @@ "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Iceblink", - "name": "GLM 4.5 Air Derestricted Iceblink", - "display_name": "GLM 4.5 Air Derestricted Iceblink", + "id": "kimi-k2-instruct-fast", + "name": "Kimi K2 0711 Fast", + "display_name": "Kimi K2 0711 Fast", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" @@ -12771,56 +11883,79 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Bigger-Body", - "name": "Llama 3.3 70B Bigger Body", - "display_name": "Llama 3.3 70B Bigger Body", + "id": "gemini-2.5-flash-nothinking", + "name": "Gemini 2.5 
Flash (No Thinking)", + "display_name": "Gemini 2.5 Flash (No Thinking)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1048756, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "hunyuan-turbos-20250226", - "name": "Hunyuan Turbo S", - "display_name": "Hunyuan Turbo S", + "id": "phi-4-mini-instruct", + "name": "Phi 4 Mini", + "display_name": "Phi 4 Mini", "modalities": { "input": [ "text" @@ -12830,8 +11965,8 @@ ] }, "limit": { - "context": 24000, - "output": 8192 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -12839,18 +11974,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.187, - "output": 0.374 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview (09/2025)", - "display_name": "Gemini 2.5 Flash Preview (09/2025)", + "id": "gemini-2.5-flash-lite-preview-09-2025-thinking", + "name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", + "display_name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", 
"modalities": { "input": [ "text", @@ -12868,19 +12003,18 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "budget", "budget": { "default": -1, - "min": 0, + "min": 512, "max": 24576, "auto": -1, - "off": 0, "unit": "tokens" }, "summaries": true, @@ -12895,45 +12029,54 @@ "release_date": "2025-09-25", "last_updated": "2025-09-25", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "GLM-4.6-Derestricted-v5", - "name": "GLM 4.6 Derestricted v5", - "display_name": "GLM 4.6 Derestricted v5", + "id": "claude-sonnet-4-thinking:64000", + "name": "Claude 4 Sonnet Thinking (64K)", + "display_name": "Claude 4 Sonnet Thinking (64K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.4, - "output": 1.5 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "glm-4-plus", - "name": "GLM-4 Plus", - "display_name": "GLM-4 Plus", + "id": "GLM-4.5-Air-Derestricted-Iceblink-ReExtract", + "name": "GLM 4.5 Air Derestricted Iceblink ReExtract", + "display_name": "GLM 4.5 Air Derestricted Iceblink ReExtract", "modalities": { "input": [ "text" @@ -12943,8 +12086,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 98304 }, "tool_call": false, "reasoning": { 
@@ -12952,48 +12095,46 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 7.497, - "output": 7.497 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Gemma-3-27B-Big-Tiger-v3", - "name": "Gemma 3 27B Big Tiger v3", - "display_name": "Gemma 3 27B Big Tiger v3", + "id": "qwen-image", + "name": "Qwen Image", + "display_name": "Qwen Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", - "cost": { - "input": 0.306, - "output": 0.306 - }, - "type": "chat" + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "type": "imageGeneration" }, { - "id": "brave-research", - "name": "Brave (Research)", - "display_name": "Brave (Research)", + "id": "doubao-seed-1-6-thinking-250615", + "name": "Doubao Seed 1.6 Thinking", + "display_name": "Doubao Seed 1.6 Thinking", "modalities": { "input": [ "text" @@ -13003,7 +12144,7 @@ ] }, "limit": { - "context": 16384, + "context": 256000, "output": 16384 }, "tool_call": false, @@ -13012,45 +12153,54 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 5, - "output": 5 + "input": 0.204, + "output": 2.04 }, "type": "chat" }, { - "id": "hidream", - "name": "Hidream", - "display_name": "Hidream", + "id": "MiniMax-M2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 
8192 + "context": 200000, + "output": 131072 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "release_date": "2025-10-25", + "last_updated": "2025-10-25", + "cost": { + "input": 0.17, + "output": 1.53 + }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max 2026-01-23", - "display_name": "Qwen3 Max 2026-01-23", + "id": "Llama-3.3-70B-The-Omega-Directive-Unslop-v2.0", + "name": "Llama 3.3 70B Omega Directive Unslop v2.0", + "display_name": "Llama 3.3 70B Omega Directive Unslop v2.0", "modalities": { "input": [ "text" @@ -13060,70 +12210,57 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.2002, - "output": 6.001 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude 4.1 Opus", - "display_name": "Claude 4.1 Opus", + "id": "Llama-3.3-70B-Sapphira-0.2", + "name": "Llama 3.3 70B Sapphira 0.2", + "display_name": "Llama 3.3 70B Sapphira 0.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": 
true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "claude-sonnet-4-20250514", + "name": "Claude 4 Sonnet", + "display_name": "Claude 4 Sonnet", "modalities": { "input": [ "text", @@ -13144,21 +12281,23 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1, - "output": 5 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "claude-sonnet-4-thinking", + "name": "Claude 4 Sonnet Thinking", + "display_name": "Claude 4 Sonnet Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -13166,26 +12305,33 @@ }, "limit": { "context": 1000000, - "output": 131072 + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.1394, - "output": 1.3328 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "gemini-2.5-flash-nothinking", - "name": "Gemini 2.5 Flash (No Thinking)", - "display_name": "Gemini 2.5 Flash (No Thinking)", + "id": "gemini-2.5-flash-preview-09-2025-thinking", + "name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", + 
"display_name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", "modalities": { "input": [ "text", @@ -13200,7 +12346,7 @@ "context": 1048756, "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -13227,8 +12373,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { "input": 0.3, "output": 2.5 @@ -13236,9 +12382,9 @@ "type": "chat" }, { - "id": "exa-research-pro", - "name": "Exa (Research Pro)", - "display_name": "Exa (Research Pro)", + "id": "ernie-x1-32k-preview", + "name": "Ernie X1 32k", + "display_name": "Ernie X1 32k", "modalities": { "input": [ "text" @@ -13248,7 +12394,7 @@ ] }, "limit": { - "context": 16384, + "context": 32000, "output": 16384 }, "tool_call": false, @@ -13257,100 +12403,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", - "cost": { - "input": 2.5, - "output": 2.5 - }, - "type": "chat" - }, - { - "id": "grok-3-fast-beta", - "name": "Grok 3 Fast Beta", - "display_name": "Grok 3 Fast Beta", - "modalities": { - "input": [ - "text", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2025-04-03", + "last_updated": "2025-04-03", "cost": { - "input": 5, - "output": 25 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101:thinking", - "name": "Claude 4.5 Opus Thinking", - "display_name": "Claude 4.5 Opus Thinking", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 200000, 
- "output": 32000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", - "cost": { - "input": 4.998, - "output": 25.007 - }, - "type": "chat" - }, - { - "id": "gemini-2.5-pro-exp-03-25", - "name": "Gemini 2.5 Pro Experimental 0325", - "display_name": "Gemini 2.5 Pro Experimental 0325", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 995904, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -13360,41 +12435,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 2.5, - "output": 10 + "input": 0.3995, + "output": 1.2002 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking", - "name": "Claude 3.7 Sonnet Thinking", - "display_name": "Claude 3.7 Sonnet Thinking", + "id": "v0-1.0-md", + "name": "v0 1.0 MD", + "display_name": "v0 1.0 MD", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -13402,115 +12467,76 @@ }, "limit": { "context": 200000, - "output": 16000 + "output": 64000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", 
- "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-07-04", + "last_updated": "2025-07-04", "cost": { - "input": 2.992, - "output": 14.994 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:8192", - "name": "Claude 4 Opus Thinking (8K)", - "display_name": "Claude 4 Opus Thinking (8K)", + "id": "Magistral-Small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.4, + "output": 1.4 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking:1024", - "name": "Claude 4 Sonnet Thinking (1K)", - "display_name": "Claude 4 Sonnet Thinking (1K)", + "id": "sonar-pro", + "name": "Perplexity Pro", + "display_name": "Perplexity Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 128000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { "input": 2.992, "output": 14.994 @@ -13518,9 +12544,9 @@ "type": "chat" }, { - "id": "Llama-3.3-70B-Magnum-v4-SE-Cirrus-x1-SLERP", - "name": "Llama 3.3 70B Magnum v4 SE Cirrus x1 SLERP", - "display_name": "Llama 3.3 70B Magnum v4 SE Cirrus x1 SLERP", + "id": "Qwen2.5-32B-EVA-v0.2", + "name": "Qwen 2.5 32b EVA", + "display_name": "Qwen 2.5 32b EVA", "modalities": { "input": [ "text" @@ -13530,8 +12556,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 24576, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -13539,18 +12565,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.493, + "output": 0.493 }, "type": "chat" }, { - "id": "step-r1-v-mini", - "name": "Step R1 V Mini", - "display_name": "Step R1 V Mini", + "id": "exa-answer", + "name": "Exa (Answer)", + "display_name": "Exa (Answer)", "modalities": { "input": [ "text" @@ -13560,8 +12586,8 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -13569,18 +12595,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-08", - "last_updated": "2025-04-08", + "release_date": "2025-06-04", + "last_updated": "2025-06-04", "cost": { "input": 2.5, - "output": 11 + "output": 2.5 }, "type": "chat" }, { - "id": "ernie-x1-32k-preview", - "name": "Ernie X1 32k", - "display_name": "Ernie X1 32k", + "id": "doubao-seed-1-6-250615", + "name": "Doubao Seed 1.6", + "display_name": "Doubao Seed 1.6", 
"modalities": { "input": [ "text" @@ -13590,7 +12616,7 @@ ] }, "limit": { - "context": 32000, + "context": 256000, "output": 16384 }, "tool_call": false, @@ -13599,18 +12625,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 0.33, - "output": 1.32 + "input": 0.204, + "output": 0.51 }, "type": "chat" }, { - "id": "Llama-3.3-70B-StrawberryLemonade-v1.0", - "name": "Llama 3.3 70B StrawberryLemonade v1.0", - "display_name": "Llama 3.3 70B StrawberryLemonade v1.0", + "id": "Llama-3.3-70B-Forgotten-Safeword-3.6", + "name": "Llama 3.3 70B Forgotten Safeword 3.6", + "display_name": "Llama 3.3 70B Forgotten Safeword 3.6", "modalities": { "input": [ "text" @@ -13638,9 +12664,9 @@ "type": "chat" }, { - "id": "KAT-Coder-Exp-72B-1010", - "name": "KAT Coder Exp 72B 1010", - "display_name": "KAT Coder Exp 72B 1010", + "id": "KAT-Coder-Air-V1", + "name": "KAT Coder Air V1", + "display_name": "KAT Coder Air V1", "modalities": { "input": [ "text" @@ -13668,131 +12694,99 @@ "type": "chat" }, { - "id": "gemini-2.5-pro-preview-03-25", - "name": "Gemini 2.5 Pro Preview 0325", - "display_name": "Gemini 2.5 Pro Preview 0325", + "id": "phi-4-multimodal-instruct", + "name": "Phi 4 Multimodal", + "display_name": "Phi 4 Multimodal", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + 
"attachment": false, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 2.5, - "output": 10 + "input": 0.07, + "output": 0.11 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:1024", - "name": "Claude 4 Opus Thinking (1K)", - "display_name": "Claude 4 Opus Thinking (1K)", + "id": "soob3123/GrayLine-Qwen3-8B", + "name": "Grayline Qwen3 8B", + "display_name": "Grayline Qwen3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16384, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude 4 Sonnet", - "display_name": "Claude 4 Sonnet", + "id": "soob3123/Veiled-Calla-12B", + "name": "Veiled Calla 12B", + "display_name": "Veiled Calla 12B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-04-13", + "last_updated": "2025-04-13", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": 
"Llama-3.3-70B-Progenitor-V3.3", - "name": "Llama 3.3 70B Progenitor V3.3", - "display_name": "Llama 3.3 70B Progenitor V3.3", + "id": "soob3123/amoral-gemma3-27B-v2", + "name": "Amoral Gemma3 27B v2", + "display_name": "Amoral Gemma3 27B v2", "modalities": { "input": [ "text" @@ -13803,7 +12797,7 @@ }, "limit": { "context": 32768, - "output": 16384 + "output": 8192 }, "tool_call": false, "reasoning": { @@ -13811,18 +12805,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2025-05-23", + "last_updated": "2025-05-23", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "Qwen2.5-32B-EVA-v0.2", - "name": "Qwen 2.5 32b EVA", - "display_name": "Qwen 2.5 32b EVA", + "id": "EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2", + "name": "EVA-Qwen2.5-72B-v0.2", + "display_name": "EVA-Qwen2.5-72B-v0.2", "modalities": { "input": [ "text" @@ -13832,7 +12826,7 @@ ] }, "limit": { - "context": 24576, + "context": 16384, "output": 8192 }, "tool_call": false, @@ -13841,18 +12835,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.493, - "output": 0.493 + "input": 0.7989999999999999, + "output": 0.7989999999999999 }, "type": "chat" }, { - "id": "brave-pro", - "name": "Brave (Pro)", - "display_name": "Brave (Pro)", + "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1", + "name": "EVA-LLaMA-3.33-70B-v0.1", + "display_name": "EVA-LLaMA-3.33-70B-v0.1", "modalities": { "input": [ "text" @@ -13862,8 +12856,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -13871,18 +12865,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", + "release_date": "2025-09-25", + "last_updated": 
"2025-09-25", "cost": { - "input": 5, - "output": 5 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "step-2-16k-exp", - "name": "Step-2 16k Exp", - "display_name": "Step-2 16k Exp", + "id": "EVA-UNIT-01/EVA-Qwen2.5-32B-v0.2", + "name": "EVA-Qwen2.5-32B-v0.2", + "display_name": "EVA-Qwen2.5-32B-v0.2", "modalities": { "input": [ "text" @@ -13892,7 +12886,7 @@ ] }, "limit": { - "context": 16000, + "context": 16384, "output": 8192 }, "tool_call": false, @@ -13901,18 +12895,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-05", - "last_updated": "2024-07-05", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 7.004, - "output": 19.992 + "input": 0.7989999999999999, + "output": 0.7989999999999999 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Fallen-R1-v1", - "name": "Llama 3.3 70B Fallen R1 v1", - "display_name": "Llama 3.3 70B Fallen R1 v1", + "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0", + "name": "EVA Llama 3.33 70B", + "display_name": "EVA Llama 3.33 70B", "modalities": { "input": [ "text" @@ -13922,7 +12916,7 @@ ] }, "limit": { - "context": 32768, + "context": 16384, "output": 16384 }, "tool_call": false, @@ -13931,68 +12925,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking", - "name": "Claude 4 Sonnet Thinking", - "display_name": "Claude 4 Sonnet Thinking", + "id": "Gryphe/MythoMax-L2-13b", + "name": "MythoMax 13B", + "display_name": "MythoMax 13B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "default_enabled": true - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", - "cost": { - "input": 2.992, - "output": 14.994 - }, - "type": "chat" - }, - { - "id": "doubao-1.5-pro-256k", - "name": "Doubao 1.5 Pro 256k", - "display_name": "Doubao 1.5 Pro 256k", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 16384 + "context": 4000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -14000,22 +12955,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.799, - "output": 1.445 + "input": 0.1003, + "output": 0.1003 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "undi95/remm-slerp-l2-13b", + "name": "ReMM SLERP 13B", + "display_name": "ReMM SLERP 13B", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -14023,48 +12977,27 @@ ] }, "limit": { - "context": 200000, - "output": 16000 + "context": 6144, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.7989999999999999, + "output": 
1.2069999999999999 }, "type": "chat" }, { - "id": "learnlm-1.5-pro-experimental", - "name": "Gemini LearnLM Experimental", - "display_name": "Gemini LearnLM Experimental", + "id": "nothingiisreal/L3.1-70B-Celeste-V0.1-BF16", + "name": "Llama 3.1 70B Celeste v0.1", + "display_name": "Llama 3.1 70B Celeste v0.1", "modalities": { "input": [ "text" @@ -14074,8 +13007,8 @@ ] }, "limit": { - "context": 32767, - "output": 8192 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -14083,18 +13016,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 3.502, - "output": 10.506 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "deepseek-ai/deepseek-v3.2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -14104,54 +13037,57 @@ ] }, "limit": { - "context": 128000, + "context": 163840, "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "chroma", - "name": "Chroma", - "display_name": "Chroma", + "id": "deepseek-ai/DeepSeek-V3.1:thinking", + "name": "DeepSeek V3.1 Thinking", + "display_name": "DeepSeek V3.1 Thinking", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 65536 }, - "temperature": true, "tool_call": false, 
"reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.2, + "output": 0.7 + }, "type": "chat" }, { - "id": "Llama-3.3-70B-Predatorial-Extasy", - "name": "Llama 3.3 70B Predatorial Extasy", - "display_name": "Llama 3.3 70B Predatorial Extasy", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -14161,27 +13097,39 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 163840 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Aurora-Borealis", - "name": "Llama 3.3 70B Aurora Borealis", - "display_name": "Llama 3.3 70B Aurora Borealis", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -14191,57 +13139,58 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-02", + "last_updated": "2025-08-02", "cost": { - "input": 0.306, - "output": 0.306 + "input": 
0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "Llama-3.3-70B-ArliAI-RPMax-v3", - "name": "Llama 3.3 70B ArliAI RPMax v3", - "display_name": "Llama 3.3 70B ArliAI RPMax v3", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "venice-uncensored", - "name": "Venice Uncensored", - "display_name": "Venice Uncensored", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus:thinking", + "name": "DeepSeek V3.1 Terminus (Thinking)", + "display_name": "DeepSeek V3.1 Terminus (Thinking)", "modalities": { "input": [ "text" @@ -14252,57 +13201,57 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "step-3", - "name": "Step-3", - "display_name": "Step-3", + "id": "deepseek-ai/deepseek-v3.2-exp-thinking", + "name": "DeepSeek V3.2 Exp Thinking", + "display_name": "DeepSeek V3.2 Exp Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 163840, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + 
"default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.2499, - "output": 0.6494 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "Llama-3.3-70B-The-Omega-Directive-Unslop-v2.0", - "name": "Llama 3.3 70B Omega Directive Unslop v2.0", - "display_name": "Llama 3.3 70B Omega Directive Unslop v2.0", + "id": "cohere/command-r-plus-08-2024", + "name": "Cohere: Command R+", + "display_name": "Cohere: Command R+", "modalities": { "input": [ "text" @@ -14312,27 +13261,27 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.856, + "output": 14.246 }, "type": "chat" }, { - "id": "auto-model", - "name": "Auto model", - "display_name": "Auto model", + "id": "cohere/command-r", + "name": "Cohere: Command R", + "display_name": "Cohere: Command R", "modalities": { "input": [ "text" @@ -14342,8 +13291,8 @@ ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -14351,22 +13300,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2024-03-11", + "last_updated": "2024-03-11", "cost": { - "input": 0, - "output": 0 + "input": 0.476, + "output": 1.428 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking:32768", - "name": "Claude 4.1 Opus Thinking (32K)", - "display_name": "Claude 4.1 Opus Thinking (32K)", + "id": "raifle/sorcererlm-8x22b", + "name": 
"SorcererLM 8x22B", + "display_name": "SorcererLM 8x22B", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -14374,34 +13322,27 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16000, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 14.994, - "output": 75.004 + "input": 4.505, + "output": 4.505 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Shakudo", - "name": "Llama 3.3 70B Shakudo", - "display_name": "Llama 3.3 70B Shakudo", + "id": "inflatebot/MN-12B-Mag-Mell-R1", + "name": "Mag Mell R1", + "display_name": "Mag Mell R1", "modalities": { "input": [ "text" @@ -14411,8 +13352,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -14420,18 +13361,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "Baichuan4-Air", - "name": "Baichuan 4 Air", - "display_name": "Baichuan 4 Air", + "id": "TEE/qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507 TEE", + "display_name": "Qwen3 30B A3B Instruct 2507 TEE", "modalities": { "input": [ "text" @@ -14441,7 +13382,7 @@ ] }, "limit": { - "context": 32768, + "context": 262000, "output": 32768 }, "tool_call": false, @@ -14450,49 +13391,54 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + 
"release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.157, - "output": 0.157 + "input": 0.15, + "output": 0.44999999999999996 }, "type": "chat" }, { - "id": "kimi-thinking-preview", - "name": "Kimi Thinking Preview", - "display_name": "Kimi Thinking Preview", + "id": "TEE/minimax-m2.1", + "name": "MiniMax M2.1 TEE", + "display_name": "MiniMax M2.1 TEE", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 31.46, - "output": 31.46 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "TEE/kimi-k2.5", + "name": "Kimi K2.5 TEE", + "display_name": "Kimi K2.5 TEE", "modalities": { "input": [ "text" @@ -14502,8 +13448,8 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 128000, + "output": 65535 }, "tool_call": false, "reasoning": { @@ -14522,87 +13468,90 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.04998, - "output": 0.2006 + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Mhnnn-x1", - "name": "Llama 3.3 70B Mhnnn x1", - "display_name": "Llama 3.3 70B Mhnnn x1", + "id": "TEE/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B TEE", + "display_name": "Qwen2.5 VL 72B TEE", "modalities": { "input": [ - "text" + "text", + "image" ], 
"output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 65536, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:32768", - "name": "Claude 4 Opus Thinking (32K)", - "display_name": "Claude 4 Opus Thinking (32K)", + "id": "TEE/deepseek-r1-0528", + "name": "DeepSeek R1 0528 TEE", + "display_name": "DeepSeek R1 0528 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 14.994, - "output": 75.004 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Argunaut-1-SFT", - "name": "Llama 3.3 70B Argunaut 1 SFT", - "display_name": "Llama 3.3 70B Argunaut 1 SFT", + "id": "TEE/deepseek-v3.2", + "name": "DeepSeek V3.2 TEE", + "display_name": "DeepSeek V3.2 TEE", "modalities": { "input": [ "text" @@ -14612,117 +13561,63 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 164000, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": 
false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0.306, - "output": 0.306 - }, - "type": "chat" - }, - { - "id": "claude-opus-4-1-thinking:1024", - "name": "Claude 4.1 Opus Thinking (1K)", - "display_name": "Claude 4.1 Opus Thinking (1K)", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 32000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.5, + "output": 1 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "TEE/kimi-k2.5-thinking", + "name": "Kimi K2.5 Thinking TEE", + "display_name": "Kimi K2.5 Thinking TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 128000, + "output": 65535 }, "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.1, - "output": 0.4 + 
"input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "phi-4-multimodal-instruct", - "name": "Phi 4 Multimodal", - "display_name": "Phi 4 Multimodal", + "id": "TEE/gemma-3-27b-it", + "name": "Gemma 3 27B TEE", + "display_name": "Gemma 3 27B TEE", "modalities": { "input": [ "text" @@ -14732,8 +13627,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -14741,18 +13636,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.07, - "output": 0.11 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "doubao-seed-2-0-code-preview-260215", - "name": "Doubao Seed 2.0 Code Preview", - "display_name": "Doubao Seed 2.0 Code Preview", + "id": "TEE/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B TEE", + "display_name": "Qwen3.5 397B A17B TEE", "modalities": { "input": [ "text" @@ -14762,27 +13657,38 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 258048, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2026-02-28", + "last_updated": "2026-02-28", "cost": { - "input": 0.782, - "output": 3.893 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "deepseek-reasoner-cheaper", - "name": "Deepseek R1 Cheaper", - "display_name": "Deepseek R1 Cheaper", + "id": "TEE/glm-4.7-flash", + "name": "GLM 4.7 Flash TEE", + "display_name": "GLM 4.7 Flash TEE", "modalities": { "input": [ "text" @@ -14792,27 +13698,32 @@ ] }, "limit": { - "context": 128000, - 
"output": 65536 + "context": 203000, + "output": 65535 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.4, - "output": 1.7 + "input": 0.15, + "output": 0.5 }, "type": "chat" }, { - "id": "exa-answer", - "name": "Exa (Answer)", - "display_name": "Exa (Answer)", + "id": "TEE/glm-4.6", + "name": "GLM 4.6 TEE", + "display_name": "GLM 4.6 TEE", "modalities": { "input": [ "text" @@ -14822,27 +13733,32 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 203000, + "output": 65535 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 2.5, - "output": 2.5 + "input": 0.75, + "output": 2 }, "type": "chat" }, { - "id": "v0-1.0-md", - "name": "v0 1.0 MD", - "display_name": "v0 1.0 MD", + "id": "TEE/gpt-oss-20b", + "name": "GPT-OSS 20B TEE", + "display_name": "GPT-OSS 20B TEE", "modalities": { "input": [ "text" @@ -14852,58 +13768,62 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "glm-4.1v-thinking-flash", - 
"name": "GLM 4.1V Thinking Flash", - "display_name": "GLM 4.1V Thinking Flash", + "id": "TEE/qwen3-coder", + "name": "Qwen3 Coder 480B TEE", + "display_name": "Qwen3 Coder 480B TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 128000, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.3, - "output": 0.3 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "azure-o1", - "name": "Azure o1", - "display_name": "Azure o1", + "id": "TEE/kimi-k2-thinking", + "name": "Kimi K2 Thinking TEE", + "display_name": "Kimi K2 Thinking TEE", "modalities": { "input": [ "text" @@ -14913,27 +13833,38 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 65535 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-17", - "last_updated": "2024-12-17", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 14.994, - "output": 59.993 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted", - "name": "GLM 4.5 Air Derestricted", - "display_name": "GLM 4.5 Air Derestricted", + "id": "TEE/deepseek-v3.1", + "name": "DeepSeek V3.1 TEE", + "display_name": "DeepSeek V3.1 TEE", "modalities": { "input": [ "text" @@ -14943,8 +13874,8 @@ ] }, "limit": { - "context": 202600, - "output": 98304 + "context": 164000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ 
-14952,18 +13883,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1, + "output": 2.5 }, "type": "chat" }, { - "id": "azure-o3-mini", - "name": "Azure o3-mini", - "display_name": "Azure o3-mini", + "id": "TEE/llama3-3-70b", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -14973,8 +13904,8 @@ ] }, "limit": { - "context": 200000, - "output": 65536 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -14982,18 +13913,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 1.088, - "output": 4.3996 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "TEE/glm-4.7", + "name": "GLM 4.7 TEE", + "display_name": "GLM 4.7 TEE", "modalities": { "input": [ "text" @@ -15003,8 +13934,8 @@ ] }, "limit": { - "context": 245800, - "output": 65536 + "context": 131000, + "output": 65535 }, "tool_call": false, "reasoning": { @@ -15023,18 +13954,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-21", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 1.3, - "output": 7.8 + "input": 0.85, + "output": 3.3 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Sapphira-0.2", - "name": "Llama 3.3 70B Sapphira 0.2", - "display_name": "Llama 3.3 70B Sapphira 0.2", + "id": "TEE/gpt-oss-120b", + "name": "GPT-OSS 120B TEE", + "display_name": "GPT-OSS 120B TEE", "modalities": { "input": [ "text" @@ -15044,57 +13975,32 @@ ] }, "limit": { - "context": 32768, + "context": 131072, "output": 16384 }, 
"tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0.306, - "output": 0.306 - }, - "type": "chat" - }, - { - "id": "Llama-3.3-70B-Anthrobomination", - "name": "Llama 3.3 70B Anthrobomination", - "display_name": "Llama 3.3 70B Anthrobomination", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 16384 + "supported": true }, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "QwQ-32B-ArliAI-RpR-v1", - "name": "QwQ 32b Arli V1", - "display_name": "QwQ 32b Arli V1", + "id": "TEE/glm-5", + "name": "GLM 5 TEE", + "display_name": "GLM 5 TEE", "modalities": { "input": [ "text" @@ -15104,8 +14010,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 203000, + "output": 65535 }, "tool_call": false, "reasoning": { @@ -15124,50 +14030,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.2, + "output": 3.5 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude 4 Opus", - "display_name": "Claude 4 Opus", + "id": "mlabonne/NeuralDaredevil-8B-abliterated", + "name": "Neural Daredevil 8B abliterated", + "display_name": "Neural Daredevil 8B abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + 
"context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.44, + "output": 0.44 }, "type": "chat" }, { - "id": "yi-lightning", - "name": "Yi Lightning", - "display_name": "Yi Lightning", + "id": "MarinaraSpaghetti/NemoMix-Unleashed-12B", + "name": "NemoMix 12B Unleashed", + "display_name": "NemoMix 12B Unleashed", "modalities": { "input": [ "text" @@ -15177,8 +14081,8 @@ ] }, "limit": { - "context": 12000, - "output": 4096 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -15186,18 +14090,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-10-16", - "last_updated": "2024-10-16", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Electra-R1", - "name": "Llama 3.3 70B Electra R1", - "display_name": "Llama 3.3 70B Electra R1", + "id": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", + "name": "Tongyi DeepResearch 30B A3B", + "display_name": "Tongyi DeepResearch 30B A3B", "modalities": { "input": [ "text" @@ -15207,8 +14111,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -15216,18 +14120,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.08, + "output": 0.24000000000000002 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Forgotten-Abomination-v5.0", - "name": "Llama 3.3 70B 
Forgotten Abomination v5.0", - "display_name": "Llama 3.3 70B Forgotten Abomination v5.0", + "id": "baseten/Kimi-K2-Instruct-FP4", + "name": "Kimi K2 0711 Instruct FP4", + "display_name": "Kimi K2 0711 Instruct FP4", "modalities": { "input": [ "text" @@ -15237,8 +14141,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -15246,18 +14150,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Cirrus-x1", - "name": "Llama 3.3 70B Cirrus x1", - "display_name": "Llama 3.3 70B Cirrus x1", + "id": "deepcogito/cogito-v1-preview-qwen-32B", + "name": "Cogito v1 Preview Qwen 32B", + "display_name": "Cogito v1 Preview Qwen 32B", "modalities": { "input": [ "text" @@ -15267,8 +14171,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -15276,18 +14180,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-05-10", + "last_updated": "2025-05-10", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.7999999999999998, + "output": 1.7999999999999998 }, "type": "chat" }, { - "id": "grok-3-mini-beta", - "name": "Grok 3 Mini Beta", - "display_name": "Grok 3 Mini Beta", + "id": "deepcogito/cogito-v2.1-671b", + "name": "Cogito v2.1 671B MoE", + "display_name": "Cogito v2.1 671B MoE", "modalities": { "input": [ "text" @@ -15297,96 +14201,101 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - 
"release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.3, - "output": 0.5 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "auto-model-standard", - "name": "Auto model (Standard)", - "display_name": "Auto model (Standard)", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 256000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", - "cost": { - "input": 9.996, - "output": 19.992 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-26", + "last_updated": "2026-01-26", + "cost": { + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929-thinking", - "name": "Claude Sonnet 4.5 Thinking", - "display_name": "Claude Sonnet 4.5 Thinking", + "id": "moonshotai/kimi-k2-thinking-turbo-original", + "name": "Kimi K2 Thinking Turbo Original", + "display_name": "Kimi K2 Thinking Turbo Original", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 256000, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - 
"last_updated": "2025-09-29", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 2.992, - "output": 14.994 + "input": 1.15, + "output": 8 }, "type": "chat" }, { - "id": "v0-1.5-md", - "name": "v0 1.5 MD", - "display_name": "v0 1.5 MD", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -15396,27 +14305,27 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 3, - "output": 15 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "kimi-k2-instruct-fast", - "name": "Kimi K2 0711 Fast", - "display_name": "Kimi K2 0711 Fast", + "id": "moonshotai/Kimi-Dev-72B", + "name": "Kimi Dev 72B", + "display_name": "Kimi Dev 72B", "modalities": { "input": [ "text", @@ -15427,8 +14336,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -15436,48 +14345,50 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.1, - "output": 2 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "glm-4-long", - "name": "GLM-4 Long", - "display_name": "GLM-4 Long", + "id": "moonshotai/kimi-k2.5:thinking", + "name": "Kimi K2.5 Thinking", + "display_name": "Kimi K2.5 Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 4096 + "context": 256000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "jamba-large-1.7", - "name": "Jamba Large 1.7", - "display_name": "Jamba Large 1.7", + "id": "moonshotai/kimi-k2-thinking-original", + "name": "Kimi K2 Thinking Original", + "display_name": "Kimi K2 Thinking Original", "modalities": { "input": [ "text" @@ -15488,30 +14399,30 @@ }, "limit": { "context": 256000, - "output": 4096 + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "qvq-max", - "name": "Qwen: QvQ Max", - "display_name": "Qwen: QvQ Max", + "id": "moonshotai/kimi-k2-instruct-0711", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -15521,24 +14432,24 @@ "context": 128000, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-28", - "last_updated": "2025-03-28", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 1.4, - "output": 5.3 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp-1219", - "name": "Gemini 2.0 Flash Thinking 1219", - "display_name": "Gemini 2.0 Flash Thinking 1219", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + 
"display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -15548,27 +14459,68 @@ ] }, "limit": { - "context": 32767, - "output": 8192 + "context": 256000, + "output": 262144 }, - "tool_call": false, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 262144 + }, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-19", - "last_updated": "2024-12-19", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.1003, - "output": 0.408 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "moonshotai/kimi-k2.6:thinking", + "name": "Kimi K2.6 Thinking", + "display_name": "Kimi K2.6 Thinking", "modalities": { "input": [ "text", @@ -15579,57 +14531,64 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 256000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-21", "cost": { - "input": 0.0748, - "output": 0.306 + "input": 0.53, + "output": 
2.73 }, "type": "chat" }, { - "id": "azure-gpt-4-turbo", - "name": "Azure gpt-4-turbo", - "display_name": "Azure gpt-4-turbo", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-21", "cost": { - "input": 9.996, - "output": 30.005 + "input": 0.53, + "output": 2.73 }, "type": "chat" }, { - "id": "Baichuan-M2", - "name": "Baichuan M2 32B Medical", - "display_name": "Baichuan M2 32B Medical", + "id": "Envoid/Llama-3.05-NT-Storybreaker-Ministral-70B", + "name": "Llama 3.05 Storybreaker Ministral 70b", + "display_name": "Llama 3.05 Storybreaker Ministral 70b", "modalities": { "input": [ "text" @@ -15639,8 +14598,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -15648,49 +14607,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 15.73, - "output": 15.73 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long 10M", - "display_name": "Qwen Long 10M", + "id": "Envoid/Llama-3.05-Nemotron-Tenyxchat-Storybreaker-70B", + "name": "Nemotron Tenyxchat Storybreaker 70b", + "display_name": "Nemotron Tenyxchat Storybreaker 70b", "modalities": { "input": [ - "text", - "pdf" + "text" ], 
"output": [ "text" ] }, "limit": { - "context": 10000000, + "context": 16384, "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.1003, - "output": 0.408 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Perplexity Reasoning Pro", - "display_name": "Perplexity Reasoning Pro", + "id": "z-ai/glm-4.6:thinking", + "name": "GLM 4.6 Thinking", + "display_name": "GLM 4.6 Thinking", "modalities": { "input": [ "text" @@ -15700,28 +14658,28 @@ ] }, "limit": { - "context": 127000, - "output": 128000 + "context": 200000, + "output": 65535 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2.006, - "output": 7.9985 + "input": 0.4, + "output": 1.5 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20:thinking", - "name": "Gemini 2.5 Flash 0520 Thinking", - "display_name": "Gemini 2.5 Flash 0520 Thinking", + "id": "z-ai/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", @@ -15732,48 +14690,28 @@ ] }, "limit": { - "context": 1048000, - "output": 65536 + "context": 64000, + "output": 96000 }, "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - 
} - }, "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2025-11-22", + "last_updated": "2025-11-22", "cost": { - "input": 0.15, - "output": 3.5 + "input": 0.6, + "output": 1.7999999999999998 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Steam-ReExtract", - "name": "GLM 4.5 Air Derestricted Steam ReExtract", - "display_name": "GLM 4.5 Air Derestricted Steam ReExtract", + "id": "z-ai/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -15783,60 +14721,69 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 65535 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.4, + "output": 1.5 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Dark-Ages-v0.1", - "name": "Llama 3.3 70B Dark Ages v0.1", - "display_name": "Llama 3.3 70B Dark Ages v0.1", + "id": "z-ai/glm-4.5v:thinking", + "name": "GLM 4.5V Thinking", + "display_name": "GLM 4.5V Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 64000, + "output": 96000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-11-22", + "last_updated": "2025-11-22", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.6, + "output": 1.7999999999999998 }, "type": "chat" }, { - "id": 
"Baichuan4-Turbo", - "name": "Baichuan 4 Turbo", - "display_name": "Baichuan 4 Turbo", + "id": "openai/chatgpt-4o-latest", + "name": "ChatGPT 4o", + "display_name": "ChatGPT 4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -15844,26 +14791,26 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 2.42, - "output": 2.42 + "input": 4.998, + "output": 14.993999999999998 }, "type": "chat" }, { - "id": "doubao-1.5-vision-pro-32k", - "name": "Doubao 1.5 Vision Pro 32k", - "display_name": "Doubao 1.5 Vision Pro 32k", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", @@ -15874,8 +14821,8 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -15883,91 +14830,103 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-01-22", - "last_updated": "2025-01-22", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.459, - "output": 1.377 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-flash", - "name": "Qwen3.6 Flash", - "display_name": "Qwen3.6 Flash", + "id": "openai/gpt-4o-mini-search-preview", + "name": "GPT-4o mini Search Preview", + "display_name": "GPT-4o mini Search Preview", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 991800, - "output": 65536 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, 
- "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.19, - "output": 1.16 + "input": 0.088, + "output": 0.35 }, "type": "chat" }, { - "id": "inflection/inflection-3-pi", - "name": "Inflection 3 Pi", - "display_name": "Inflection 3 Pi", + "id": "openai/gpt-5.2", + "name": "GPT 5.2", + "display_name": "GPT 5.2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 2.499, - "output": 9.996 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "inflection/inflection-3-productivity", - "name": "Inflection 3 Productivity", - "display_name": "Inflection 3 Productivity", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo", + "display_name": "GPT-3.5 Turbo", "modalities": { "input": [ "text" @@ -15977,7 +14936,7 @@ ] }, "limit": { - "context": 8000, + "context": 16385, "output": 4096 }, "tool_call": false, @@ -15986,18 +14945,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-10-11", - 
"last_updated": "2024-10-11", + "release_date": "2022-11-30", + "last_updated": "2024-01-01", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "essentialai/rnj-1-instruct", - "name": "RNJ-1 Instruct 8B", - "display_name": "RNJ-1 Instruct 8B", + "id": "openai/o3-pro-2025-06-10", + "name": "OpenAI o3-pro (2025-06-10)", + "display_name": "OpenAI o3-pro (2025-06-10)", "modalities": { "input": [ "text" @@ -16007,27 +14966,42 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-13", - "last_updated": "2025-12-13", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 0.15, - "output": 0.15 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "LLM360/K2-Think", - "name": "K2-Think", - "display_name": "K2-Think", + "id": "openai/o1-preview", + "name": "OpenAI o1-preview", + "display_name": "OpenAI o1-preview", "modalities": { "input": [ "text" @@ -16042,22 +15016,37 @@ }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.17, - "output": 0.68 + "input": 
14.993999999999998, + "output": 59.993 }, "type": "chat" }, { - "id": "TEE/kimi-k2.5", - "name": "Kimi K2.5 TEE", - "display_name": "Kimi K2.5 TEE", + "id": "openai/gpt-5.1-2025-11-13", + "name": "GPT-5.1 (2025-11-13)", + "display_name": "GPT-5.1 (2025-11-13)", "modalities": { "input": [ "text" @@ -16067,291 +15056,339 @@ ] }, "limit": { - "context": 128000, - "output": 65535 + "context": 1000000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.9 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/glm-4.7", - "name": "GLM 4.7 TEE", - "display_name": "GLM 4.7 TEE", + "id": "openai/gpt-5-chat-latest", + "name": "GPT 5 Chat", + "display_name": "GPT 5 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 65535 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": 
"2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.85, - "output": 3.3 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B TEE", - "display_name": "Qwen3.5 397B A17B TEE", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT 5.1 Codex Mini", + "display_name": "GPT 5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 258048, - "output": 65536 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-02-28", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "TEE/glm-5", - "name": "GLM 5 TEE", - "display_name": "GLM 5 TEE", + "id": "openai/gpt-5.2-pro", + "name": "GPT 5.2 Pro", + "display_name": "GPT 5.2 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 203000, - "output": 65535 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + 
"default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 1.2, - "output": 3.5 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "TEE/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B TEE", - "display_name": "Qwen2.5 VL 72B TEE", + "id": "openai/gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.7, - "output": 0.7 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "TEE/minimax-m2.1", - "name": "MiniMax M2.1 TEE", - "display_name": "MiniMax M2.1 TEE", + "id": "openai/gpt-5.1-chat", + "name": "GPT 5.1 Chat", + "display_name": "GPT 5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 400000, + "output": 128000 }, - "tool_call": 
true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507 TEE", - "display_name": "Qwen3 30B A3B Instruct 2507 TEE", + "id": "openai/gpt-5.1-chat-latest", + "name": "GPT 5.1 Chat (Latest)", + "display_name": "GPT 5.1 Chat (Latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 32768 + "context": 400000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.15, - "output": 0.44999999999999996 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/deepseek-v3.1", - "name": "DeepSeek V3.1 TEE", - "display_name": "DeepSeek V3.1 TEE", + "id": "openai/gpt-4.1", + "name": "GPT 4.1", + "display_name": "GPT 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 8192 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-09-10", + "last_updated": "2025-09-10", "cost": { - "input": 1, - "output": 2.5 + "input": 2, + "output": 8 }, "type": 
"chat" }, { - "id": "TEE/llama3-3-70b", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "openai/gpt-4o-search-preview", + "name": "GPT-4o Search Preview", + "display_name": "GPT-4o Search Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -16365,20 +15402,20 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 2, - "output": 2 + "input": 1.47, + "output": 5.88 }, "type": "chat" }, { - "id": "TEE/glm-4.6", - "name": "GLM 4.6 TEE", - "display_name": "GLM 4.6 TEE", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -16388,12 +15425,13 @@ ] }, "limit": { - "context": 203000, - "output": 65535 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -16402,18 +15440,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.75, - "output": 2 + "input": 0.04, + "output": 0.15 }, "type": "chat" }, { - "id": "TEE/kimi-k2.5-thinking", - "name": "Kimi K2.5 Thinking TEE", - "display_name": "Kimi K2.5 Thinking TEE", + "id": "openai/gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "display_name": "GPT OSS Safeguard 20B", "modalities": { "input": [ "text" @@ -16424,7 +15462,7 @@ }, "limit": { "context": 128000, - "output": 65535 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -16433,83 +15471,96 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": "2025-10-29", + "last_updated": 
"2025-10-29", "cost": { - "input": 0.3, - "output": 1.9 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "TEE/gemma-3-27b-it", - "name": "Gemma 3 27B TEE", - "display_name": "Gemma 3 27B TEE", + "id": "openai/gpt-5-pro", + "name": "GPT 5 Pro", + "display_name": "GPT 5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", - "cost": { - "input": 0.2, - "output": 0.8 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "TEE/deepseek-v3.2", - "name": "DeepSeek V3.2 TEE", - "display_name": "DeepSeek V3.2 TEE", + "id": "openai/gpt-4.1-mini", + "name": "GPT 4.1 Mini", + "display_name": "GPT 4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 65536 + "context": 1047576, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.5, - "output": 1 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "TEE/gpt-oss-20b", - "name": "GPT-OSS 
20B TEE", - "display_name": "GPT-OSS 20B TEE", + "id": "openai/gpt-4-turbo-preview", + "name": "GPT-4 Turbo Preview", + "display_name": "GPT-4 Turbo Preview", "modalities": { "input": [ "text" @@ -16519,176 +15570,216 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2023-11-06", + "last_updated": "2024-01-01", "cost": { - "input": 0.2, - "output": 0.8 + "input": 9.996, + "output": 30.004999999999995 }, "type": "chat" }, { - "id": "TEE/qwen3-coder", - "name": "Qwen3 Coder 480B TEE", - "display_name": "Qwen3 Coder 480B TEE", + "id": "openai/gpt-5.1", + "name": "GPT 5.1", + "display_name": "GPT 5.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1.5, - "output": 2 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/glm-4.7-flash", - "name": "GLM 4.7 Flash TEE", - "display_name": "GLM 4.7 Flash TEE", + "id": "openai/gpt-5-nano", + "name": "GPT 5 Nano", 
+ "display_name": "GPT 5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 203000, - "output": 65535 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.5 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "TEE/gpt-oss-120b", - "name": "GPT-OSS 120B TEE", - "display_name": "GPT-OSS 120B TEE", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2, - "output": 2 + "input": 0.1496, + "output": 0.595 }, "type": "chat" }, { - "id": "TEE/deepseek-r1-0528", - "name": "DeepSeek R1 0528 TEE", - "display_name": "DeepSeek R1 0528 TEE", + "id": "openai/o1-pro", + "name": "OpenAI o1 Pro", + "display_name": "OpenAI o1 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" 
] }, "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 100000 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 2, - "output": 2 + "input": 150, + "output": 600 }, "type": "chat" }, { - "id": "TEE/kimi-k2-thinking", - "name": "Kimi K2 Thinking TEE", - "display_name": "Kimi K2 Thinking TEE", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -16696,37 +15787,26 @@ }, "limit": { "context": 128000, - "output": 65535 + "output": 4096 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2023-11-06", + "last_updated": "2024-01-01", "cost": { - "input": 2, - "output": 2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "CrucibleLab/L3.3-70B-Loki-V2.0", - "name": "L3.3 70B Loki v2.0", - "display_name": "L3.3 70B Loki v2.0", + "id": "openai/o3-mini-low", + "name": "OpenAI o3-mini (Low)", + "display_name": "OpenAI o3-mini (Low)", "modalities": { "input": [ "text" @@ 
-16736,59 +15816,87 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2:thinking", - "name": "DeepSeek V3.2 Thinking", - "display_name": "DeepSeek V3.2 Thinking", + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "OpenAI o1", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 200000, + "output": 100000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2024-12-17", + "last_updated": "2024-12-17", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 14.993999999999998, + "output": 59.993 }, "type": "chat" }, { - "id": "deepseek/deepseek-prover-v2-671b", - "name": "DeepSeek Prover v2 671B", - "display_name": "DeepSeek Prover v2 671B", + "id": "openai/o3-mini-high", + "name": "OpenAI o3-mini (High)", + 
"display_name": "OpenAI o3-mini (High)", "modalities": { "input": [ "text" @@ -16798,30 +15906,46 @@ ] }, "limit": { - "context": 160000, - "output": 16384 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-04-30", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 1, - "output": 2.5 + "input": 0.64, + "output": 2.588 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-speciale", - "name": "DeepSeek V3.2 Speciale", - "display_name": "DeepSeek V3.2 Speciale", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT 5.1 Codex Max", + "display_name": "GPT 5.1 Codex Max", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -16829,69 +15953,94 @@ ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 2.5, + "output": 20 }, "type": "chat" }, { - "id": 
"deepseek/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "openai/o4-mini-high", + "name": "OpenAI o4-mini high", + "display_name": "OpenAI o4-mini high", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "Doctor-Shotgun/MS3.2-24B-Magnum-Diamond", - "name": "MS3.2 24B Magnum Diamond", - "display_name": "MS3.2 24B Magnum Diamond", + "id": "openai/o4-mini-deep-research", + "name": "OpenAI o4-mini Deep Research", + "display_name": "OpenAI o4-mini Deep Research", "modalities": { "input": [ "text" @@ -16901,30 +16050,46 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 200000, + "output": 100000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.49299999999999994, - "output": 
0.49299999999999994 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "NeverSleep/Llama-3-Lumimaid-70B-v0.1", - "name": "Lumimaid 70b", - "display_name": "Lumimaid 70b", + "id": "openai/gpt-4.1-nano", + "name": "GPT 4.1 Nano", + "display_name": "GPT 4.1 Nano", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -16932,8 +16097,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 1047576, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -16941,18 +16106,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2.006, - "output": 2.006 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "NeverSleep/Lumimaid-v0.2-70B", - "name": "Lumimaid v0.2", - "display_name": "Lumimaid v0.2", + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "OpenAI o4-mini", "modalities": { "input": [ "text" @@ -16962,147 +16127,233 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1, - "output": 1.5 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Cu-Mai-R1-70b", - "name": "Llama 3.3 70B Cu Mai", - "display_name": "Llama 3.3 70B Cu Mai", + "id": "openai/gpt-5.1-codex", + "name": "GPT 5.1 Codex", + "display_name": "GPT 5.1 Codex", "modalities": { "input": 
[ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Nevoria-R1-70b", - "name": "Steelskull Nevoria R1 70b", - "display_name": "Steelskull Nevoria R1 70b", + "id": "openai/gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Evayale-70B", - "name": "Evayale 70b ", - "display_name": "Evayale 70b ", + "id": "openai/gpt-5.2-codex", + "name": "GPT 5.2 Codex", + "display_name": "GPT 5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 
16384 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Electra-R1-70b", - "name": "Steelskull Electra R1 70b", - "display_name": "Steelskull Electra R1 70b", + "id": "openai/gpt-5-mini", + "name": "GPT 5 Mini", + "display_name": "GPT 5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.69989, - "output": 0.69989 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Nevoria-70b", - "name": "Steelskull Nevoria 
70b", - "display_name": "Steelskull Nevoria 70b", + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "OpenAI o3-mini", "modalities": { "input": [ "text" @@ -17112,87 +16363,105 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Evalebis-70b", - "name": "MS Evalebis 70b", - "display_name": "MS Evalebis 70b", + "id": "openai/gpt-5.2-chat", + "name": "GPT 5.2 Chat", + "display_name": "GPT 5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 400000, "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "miromind-ai/mirothinker-v1.5-235b", - "name": "MiroThinker v1.5 235B", - "display_name": "MiroThinker v1.5 235B", + "id": "openai/gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ - "text" + "text", 
+ "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4000 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-07", - "last_updated": "2026-01-07", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 0.3, - "output": 1.2 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "pamanseau/OpenReasoning-Nemotron-32B", - "name": "OpenReasoning Nemotron 32B", - "display_name": "OpenReasoning Nemotron 32B", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -17202,28 +16471,33 @@ ] }, "limit": { - "context": 32768, - "output": 65536 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ "text" @@ -17233,27 +16507,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - 
"release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.045000000000000005, - "output": 0.15 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large", - "name": "Trinity Large", - "display_name": "Trinity Large", + "id": "openai/o3-deep-research", + "name": "OpenAI o3 Deep Research", + "display_name": "OpenAI o3 Deep Research", "modalities": { "input": [ "text" @@ -17263,57 +16552,96 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.25, - "output": 1 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "cognitivecomputations/dolphin-2.9.2-qwen2-72b", - "name": "Dolphin 72b", - "display_name": "Dolphin 72b", + "id": "openai/gpt-5", + "name": "GPT 5", + "display_name": "GPT 5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + 
], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "deepcogito/cogito-v1-preview-qwen-32B", - "name": "Cogito v1 Preview Qwen 32B", - "display_name": "Cogito v1 Preview Qwen 32B", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -17323,27 +16651,33 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-10", - "last_updated": "2025-05-10", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 1.7999999999999998, - "output": 1.7999999999999998 + "input": 0.3, + "output": 2.55 }, "type": "chat" }, { - "id": "deepcogito/cogito-v2.1-671b", - "name": "Cogito v2.1 671B MoE", - "display_name": "Cogito v2.1 671B MoE", + "id": "zai-org/glm-5:thinking", + "name": "GLM 5 Thinking", + "display_name": "GLM 5 Thinking", "modalities": { "input": [ "text" @@ -17353,28 +16687,28 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 1.25, - "output": 1.25 + "input": 0.3, + "output": 2.55 }, "type": "chat" }, { - "id": 
"Salesforce/Llama-xLAM-2-70b-fc-r", - "name": "Llama-xLAM-2 70B fc-r", - "display_name": "Llama-xLAM-2 70B fc-r", + "id": "zai-org/glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -17384,27 +16718,33 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-13", - "last_updated": "2025-04-13", + "open_weights": true, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 2.5, - "output": 2.5 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { - "id": "soob3123/Veiled-Calla-12B", - "name": "Veiled Calla 12B", - "display_name": "Veiled Calla 12B", + "id": "zai-org/glm-5.1:thinking", + "name": "GLM 5.1 Thinking", + "display_name": "GLM 5.1 Thinking", "modalities": { "input": [ "text" @@ -17414,27 +16754,28 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-13", - "last_updated": "2025-04-13", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { "input": 0.3, - "output": 0.3 + "output": 2.55 }, "type": "chat" }, { - "id": "soob3123/GrayLine-Qwen3-8B", - "name": "Grayline Qwen3 8B", - "display_name": "Grayline Qwen3 8B", + "id": "zai-org/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -17444,27 +16785,39 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": 
true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.15, + "output": 0.8 }, "type": "chat" }, { - "id": "soob3123/amoral-gemma3-27B-v2", - "name": "Amoral Gemma3 27B v2", - "display_name": "Amoral Gemma3 27B v2", + "id": "zai-org/glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -17474,30 +16827,43 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-23", - "last_updated": "2025-05-23", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { "input": 0.3, - "output": 0.3 + "output": 2.55 }, "type": "chat" }, { - "id": "nex-agi/deepseek-v3.1-nex-n1", - "name": "DeepSeek V3.1 Nex N1", - "display_name": "DeepSeek V3.1 Nex N1", + "id": "unsloth/gemma-3-27b-it", + "name": "Gemma 3 27B IT", + "display_name": "Gemma 3 27B IT", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" @@ -17505,56 +16871,57 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 96000 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, 
"open_weights": false, - "release_date": "2025-12-10", - "last_updated": "2025-12-10", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 0.2992, + "output": 0.2992 }, "type": "chat" }, { - "id": "Envoid/Llama-3.05-NT-Storybreaker-Ministral-70B", - "name": "Llama 3.05 Storybreaker Ministral 70b", - "display_name": "Llama 3.05 Storybreaker Ministral 70b", + "id": "unsloth/gemma-3-12b-it", + "name": "Gemma 3 12B IT", + "display_name": "Gemma 3 12B IT", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 131072 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.272, + "output": 0.272 }, "type": "chat" }, { - "id": "Envoid/Llama-3.05-Nemotron-Tenyxchat-Storybreaker-70B", - "name": "Nemotron Tenyxchat Storybreaker 70b", - "display_name": "Nemotron Tenyxchat Storybreaker 70b", + "id": "unsloth/gemma-3-1b-it", + "name": "Gemma 3 1B IT", + "display_name": "Gemma 3 1B IT", "modalities": { "input": [ "text" @@ -17564,7 +16931,7 @@ ] }, "limit": { - "context": 16384, + "context": 128000, "output": 8192 }, "tool_call": false, @@ -17573,18 +16940,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.1003, + "output": 0.1003 }, "type": "chat" }, { - "id": "anthracite-org/magnum-v4-72b", - "name": "Magnum v4 72B", - "display_name": "Magnum v4 72B", + "id": 
"unsloth/gemma-3-4b-it", + "name": "Gemma 3 4B IT", + "display_name": "Gemma 3 4B IT", "modalities": { "input": [ "text", @@ -17595,7 +16962,7 @@ ] }, "limit": { - "context": 16384, + "context": 128000, "output": 8192 }, "tool_call": false, @@ -17604,18 +16971,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 2.006, - "output": 2.992 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "anthracite-org/magnum-v2-72b", - "name": "Magnum V2 72B", - "display_name": "Magnum V2 72B", + "id": "aion-labs/aion-1.0", + "name": "Aion 1.0", + "display_name": "Aion 1.0", "modalities": { "input": [ "text" @@ -17625,7 +16992,7 @@ ] }, "limit": { - "context": 16384, + "context": 65536, "output": 8192 }, "tool_call": false, @@ -17634,18 +17001,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", "cost": { - "input": 2.006, - "output": 2.992 + "input": 3.995, + "output": 7.99 }, "type": "chat" }, { - "id": "ReadyArt/MS3.2-The-Omega-Directive-24B-Unslop-v2.0", - "name": "Omega Directive 24B Unslop v2.0", - "display_name": "Omega Directive 24B Unslop v2.0", + "id": "aion-labs/aion-rp-llama-3.1-8b", + "name": "Llama 3.1 8b (uncensored)", + "display_name": "Llama 3.1 8b (uncensored)", "modalities": { "input": [ "text" @@ -17655,8 +17022,8 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -17664,18 +17031,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": 
"ReadyArt/The-Omega-Abomination-L-70B-v1.0", - "name": "The Omega Abomination V1", - "display_name": "The Omega Abomination V1", + "id": "aion-labs/aion-1.0-mini", + "name": "Aion 1.0 mini (DeepSeek)", + "display_name": "Aion 1.0 mini (DeepSeek)", "modalities": { "input": [ "text" @@ -17685,8 +17052,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -17694,49 +17061,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 0.7, - "output": 0.95 + "input": 0.7989999999999999, + "output": 1.394 }, "type": "chat" }, { - "id": "undi95/remm-slerp-l2-13b", - "name": "ReMM SLERP 13B", - "display_name": "ReMM SLERP 13B", + "id": "Doctor-Shotgun/MS3.2-24B-Magnum-Diamond", + "name": "MS3.2 24B Magnum Diamond", + "display_name": "MS3.2 24B Magnum Diamond", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 6144, - "output": 4096 + "context": 16384, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.7989999999999999, - "output": 1.2069999999999999 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "MarinaraSpaghetti/NemoMix-Unleashed-12B", - "name": "NemoMix 12B Unleashed", - "display_name": "NemoMix 12B Unleashed", + "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24b Instruct", + "display_name": "Mistral Small 3.2 24b Instruct", "modalities": { "input": [ "text" @@ -17746,8 +17112,8 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 131072 
}, "tool_call": false, "reasoning": { @@ -17755,49 +17121,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.2, + "output": 0.4 }, "type": "chat" }, { - "id": "allenai/molmo-2-8b", - "name": "Molmo 2 8B", - "display_name": "Molmo 2 8B", + "id": "LLM360/K2-Think", + "name": "K2-Think", + "display_name": "K2-Think", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 36864, - "output": 36864 + "context": 128000, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "allenai/olmo-3.1-32b-instruct", - "name": "Olmo 3.1 32B Instruct", - "display_name": "Olmo 3.1 32B Instruct", + "id": "Sao10K/L3-8B-Stheno-v3.2", + "name": "Sao10K Stheno 8b", + "display_name": "Sao10K Stheno 8b", "modalities": { "input": [ "text" @@ -17807,7 +17172,7 @@ ] }, "limit": { - "context": 65536, + "context": 16384, "output": 8192 }, "tool_call": false, @@ -17816,18 +17181,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-01-25", - "last_updated": "2026-01-25", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "allenai/olmo-3.1-32b-think", - "name": "Olmo 3.1 32B Think", - "display_name": "Olmo 3.1 32B Think", + "id": "Sao10K/L3.1-70B-Hanami-x1", + "name": "Llama 3.1 70B Hanami", + "display_name": "Llama 3.1 70B Hanami", "modalities": { "input": [ "text" @@ 
-17837,28 +17202,27 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-25", - "last_updated": "2026-01-25", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, - "output": 0.5 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "allenai/olmo-3-32b-think", - "name": "Olmo 3 32B Think", - "display_name": "Olmo 3 32B Think", + "id": "Sao10K/L3.3-70B-Euryale-v2.3", + "name": "Llama 3.3 70B Euryale", + "display_name": "Llama 3.3 70B Euryale", "modalities": { "input": [ "text" @@ -17868,28 +17232,27 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 20480, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.3, - "output": 0.44999999999999996 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash:thinking", - "name": "Step 3.5 Flash Thinking", - "display_name": "Step 3.5 Flash Thinking", + "id": "Sao10K/L3.1-70B-Euryale-v2.2", + "name": "Llama 3.1 70B Euryale", + "display_name": "Llama 3.1 70B Euryale", "modalities": { "input": [ "text" @@ -17899,28 +17262,27 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 20480, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - 
"input": 0.2, - "output": 0.5 + "input": 0.306, + "output": 0.357 }, "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "amazon/nova-pro-v1", + "name": "Amazon Nova Pro 1.0", + "display_name": "Amazon Nova Pro 1.0", "modalities": { "input": [ "text" @@ -17930,28 +17292,27 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 300000, + "output": 32000 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.7989999999999999, + "output": 3.1959999999999997 }, "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "amazon/nova-2-lite-v1", + "name": "Amazon Nova 2 Lite", + "display_name": "Amazon Nova 2 Lite", "modalities": { "input": [ "text" @@ -17961,39 +17322,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1000000, + "output": 65535 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.15, - "output": 0.8 + "input": 0.5099999999999999, + "output": 4.25 }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "amazon/nova-lite-v1", + "name": "Amazon Nova Lite 1.0", + "display_name": "Amazon Nova Lite 1.0", 
"modalities": { "input": [ "text" @@ -18003,39 +17352,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 300000, + "output": 5120 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.0595, + "output": 0.238 }, "type": "chat" }, { - "id": "zai-org/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "amazon/nova-micro-v1", + "name": "Amazon Nova Micro 1.0", + "display_name": "Amazon Nova Micro 1.0", "modalities": { "input": [ "text" @@ -18045,33 +17382,27 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 5120 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.0357, + "output": 0.1394 }, "type": "chat" }, { - "id": "zai-org/glm-5.1:thinking", - "name": "GLM 5.1 Thinking", - "display_name": "GLM 5.1 Thinking", + "id": "CrucibleLab/L3.3-70B-Loki-V2.0", + "name": "L3.3 70B Loki v2.0", + "display_name": "L3.3 70B Loki v2.0", "modalities": { "input": [ "text" @@ -18081,28 +17412,27 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 16384, + "output": 16384 }, - "tool_call": 
true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "zai-org/glm-5:thinking", - "name": "GLM 5 Thinking", - "display_name": "GLM 5 Thinking", + "id": "THUDM/GLM-4-32B-0414", + "name": "GLM 4 32B 0414", + "display_name": "GLM 4 32B 0414", "modalities": { "input": [ "text" @@ -18112,28 +17442,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "GLM Z1 32B 0414", + "display_name": "GLM Z1 32B 0414", "modalities": { "input": [ "text" @@ -18143,33 +17472,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.07, - "output": 0.4 + "input": 
0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "featherless-ai/Qwerky-72B", - "name": "Qwerky 72B", - "display_name": "Qwerky 72B", + "id": "THUDM/GLM-Z1-Rumination-32B-0414", + "name": "GLM Z1 Rumination 32B 0414", + "display_name": "GLM Z1 Rumination 32B 0414", "modalities": { "input": [ "text" @@ -18180,7 +17503,7 @@ }, "limit": { "context": 32000, - "output": 8192 + "output": 65536 }, "tool_call": false, "reasoning": { @@ -18188,18 +17511,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-20", - "last_updated": "2025-03-20", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "mlabonne/NeuralDaredevil-8B-abliterated", - "name": "Neural Daredevil 8B abliterated", - "display_name": "Neural Daredevil 8B abliterated", + "id": "THUDM/GLM-4-9B-0414", + "name": "GLM 4 9B 0414", + "display_name": "GLM 4 9B 0414", "modalities": { "input": [ "text" @@ -18209,8 +17532,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32000, + "output": 8000 }, "tool_call": false, "reasoning": { @@ -18218,49 +17541,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.44, - "output": 0.44 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "raifle/sorcererlm-8x22b", - "name": "SorcererLM 8x22B", - "display_name": "SorcererLM 8x22B", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "GLM Z1 9B 0414", + "display_name": "GLM Z1 9B 0414", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 8192 + "context": 32000, + "output": 8000 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": 
"2025-01-01", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 4.505, - "output": 4.505 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x7b-instruct-v0.1", - "name": "Mixtral 8x7B", - "display_name": "Mixtral 8x7B", + "id": "inflection/inflection-3-productivity", + "name": "Inflection 3 Productivity", + "display_name": "Inflection 3 Productivity", "modalities": { "input": [ "text" @@ -18270,8 +17592,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -18279,18 +17601,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "cost": { - "input": 0.27, - "output": 0.27 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "mistralai/mistral-saba", - "name": "Mistral Saba", - "display_name": "Mistral Saba", + "id": "inflection/inflection-3-pi", + "name": "Inflection 3 Pi", + "display_name": "Inflection 3 Pi", "modalities": { "input": [ "text" @@ -18300,8 +17622,8 @@ ] }, "limit": { - "context": 32000, - "output": 32768 + "context": 8000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -18309,49 +17631,54 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "cost": { - "input": 0.1989, - "output": 0.595 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "mistralai/mistral-large-3-675b-instruct-2512", - "name": "Mistral Large 3 675B", - "display_name": "Mistral Large 3 675B", + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 256000 + "context": 200000, + "output": 131072 
}, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 1, - "output": 3 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "mistralai/devstral-2-123b-instruct-2512", - "name": "Devstral 2 123B", - "display_name": "Devstral 2 123B", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -18361,27 +17688,33 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.4, - "output": 1.4 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Codestral 2508", - "display_name": "Codestral 2508", + "id": "minimax/minimax-m2-her", + "name": "MiniMax M2-her", + "display_name": "MiniMax M2-her", "modalities": { "input": [ "text" @@ -18391,8 +17724,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 65532, + "output": 2048 }, "tool_call": false, "reasoning": { @@ -18400,79 +17733,91 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "release_date": "2026-01-24", + "last_updated": "2026-01-24", "cost": { - "input": 0.3, - "output": 0.8999999999999999 + "input": 0.30200000000000005, + 
"output": 1.2069999999999999 }, "type": "chat" }, { - "id": "mistralai/ministral-14b-instruct-2512", - "name": "Ministral 3 14B", - "display_name": "Ministral 3 14B", + "id": "minimax/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "mistralai/mistral-tiny", - "name": "Mistral Tiny", - "display_name": "Mistral Tiny", + "id": "minimax/minimax-01", + "name": "MiniMax 01", + "display_name": "MiniMax 01", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 1000192, + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2024-01-01", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0.25499999999999995, - "output": 0.25499999999999995 + "input": 0.1394, + "output": 1.1219999999999999 }, "type": "chat" }, { - "id": "mistralai/ministral-8b-2512", - "name": "Ministral 8B", - "display_name": "Ministral 8B", + "id": "Tongyi-Zhiwen/QwenLong-L1-32B", + "name": "QwenLong L1 32B", + "display_name": "QwenLong L1 32B", 
"modalities": { "input": [ "text" @@ -18482,8 +17827,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 40960 }, "tool_call": false, "reasoning": { @@ -18491,78 +17836,82 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.13999999999999999, + "output": 0.6 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x22b-instruct-v0.1", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "x-ai/grok-4-07-09", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 256000, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.8999999999999999, - "output": 0.8999999999999999 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3.1", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "x-ai/grok-4-fast:thinking", + "name": "Grok 4 Fast Thinking", + "display_name": "Grok 4 Fast Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 2000000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2025-07-09", + "last_updated": 
"2025-07-09", "cost": { - "input": 0.4, - "output": 2 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/ministral-3b-2512", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "x-ai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -18572,57 +17921,65 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "x-ai/grok-4.1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 2000000, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.1003, - "output": 0.1207 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "x-ai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ "text", @@ -18633,58 +17990,60 @@ ] }, "limit": { - "context": 131072, - 
"output": 32768 + "context": 2000000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-09-20", + "last_updated": "2025-09-20", "cost": { - "input": 0.4, - "output": 2 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct", - "name": "Mistral 7B Instruct", - "display_name": "Mistral 7B Instruct", + "id": "x-ai/grok-4.1-fast", + "name": "Grok 4.1 Fast", + "display_name": "Grok 4.1 Fast", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 2000000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.0544, - "output": 0.0544 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/Devstral-Small-2505", - "name": "Mistral Devstral Small 2505", - "display_name": "Mistral Devstral Small 2505", + "id": "Salesforce/Llama-xLAM-2-70b-fc-r", + "name": "Llama-xLAM-2 70B fc-r", + "display_name": "Llama-xLAM-2 70B fc-r", "modalities": { "input": [ "text" @@ -18694,8 +18053,8 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -18703,18 +18062,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-02", - "last_updated": "2025-08-02", + "release_date": "2025-04-13", + "last_updated": "2025-04-13", "cost": { - "input": 0.060000000000000005, - "output": 0.060000000000000005 + "input": 2.5, + "output": 2.5 }, "type": "chat" }, { - 
"id": "mistralai/mistral-small-creative", - "name": "Mistral Small Creative", - "display_name": "Mistral Small Creative", + "id": "nvidia/nvidia-nemotron-nano-9b-v2", + "name": "Nvidia Nemotron Nano 9B v2", + "display_name": "Nvidia Nemotron Nano 9B v2", "modalities": { "input": [ "text" @@ -18724,27 +18083,27 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "mistralai/mistral-large", - "name": "Mistral Large 2411", - "display_name": "Mistral Large 2411", + "id": "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5", + "name": "Nvidia Nemotron Super 49B v1.5", + "display_name": "Nvidia Nemotron Super 49B v1.5", "modalities": { "input": [ "text" @@ -18755,7 +18114,7 @@ }, "limit": { "context": 128000, - "output": 256000 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -18763,18 +18122,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-02-26", - "last_updated": "2024-02-26", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 2.006, - "output": 6.001 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "mistralai/ministral-14b-2512", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "nvidia/Llama-3.3-Nemotron-Super-49B-v1", + "name": "Nvidia Nemotron Super 49B", + "display_name": "Nvidia Nemotron Super 49B", "modalities": { "input": [ "text" @@ -18784,8 +18143,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -18793,18 +18152,18 @@ }, "attachment": false, "open_weights": false, - 
"release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "shisa-ai/shisa-v2.1-llama3.3-70b", - "name": "Shisa V2.1 Llama 3.3 70B", - "display_name": "Shisa V2.1 Llama 3.3 70B", + "id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", + "name": "Nvidia Nemotron 70b", + "display_name": "Nvidia Nemotron 70b", "modalities": { "input": [ "text" @@ -18814,8 +18173,8 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -18823,18 +18182,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.357, + "output": 0.408 }, "type": "chat" }, { - "id": "shisa-ai/shisa-v2-llama3.3-70b", - "name": "Shisa V2 Llama 3.3 70B", - "display_name": "Shisa V2 Llama 3.3 70B", + "id": "nvidia/Llama-3.1-Nemotron-Ultra-253B-v1", + "name": "Nvidia Nemotron Ultra 253B", + "display_name": "Nvidia Nemotron Ultra 253B", "modalities": { "input": [ "text" @@ -18853,18 +18212,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.4, + "output": 0.8 }, "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama 3.3 70b Instruct", - "display_name": "Llama 3.3 70b Instruct", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "Nvidia Nemotron 3 Nano 30B", + "display_name": "Nvidia Nemotron 3 Nano 30B", "modalities": { "input": [ "text" @@ -18874,122 +18233,269 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 262144 }, - "tool_call": true, + 
"tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2025-12-15", + "last_updated": "2025-12-15", "cost": { - "input": 0.05, - "output": 0.23 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout", - "name": "Llama 4 Scout", - "display_name": "Llama 4 Scout", + "id": "anthropic/claude-sonnet-4.6:thinking", + "name": "Claude Sonnet 4.6 Thinking", + "display_name": "Claude Sonnet 4.6 Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 328000, - "output": 65536 + "context": 1000000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.085, - "output": 0.46 + "input": 2.992, + "output": 14.993999999999998 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick", - "name": "Llama 4 Maverick", - "display_name": "Llama 4 Maverick", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.18000000000000002, - "output": 0.8 + "input": 2.992, + "output": 14.993999999999998 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-90b-vision-instruct", - "name": "Llama 3.2 Medium", - "display_name": "Llama 3.2 Medium", + "id": "anthropic/claude-opus-4.6:thinking:low", + "name": "Claude 4.6 Opus Thinking Low", + "display_name": "Claude 4.6 Opus Thinking Low", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 4.998, + "output": 25.007 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4.6", + "name": "Claude 4.6 Opus", + "display_name": "Claude 4.6 Opus", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.9009999999999999, - "output": 0.9009999999999999 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Llama 3.2 3b Instruct", - "display_name": "Llama 3.2 3b Instruct", + "id": "anthropic/claude-opus-4.6:thinking:medium", + "name": "Claude 4.6 Opus Thinking Medium", + "display_name": "Claude 4.6 Opus Thinking Medium", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -18997,50 +18503,165 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.0306, - "output": 0.0493 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Llama 3.1 8b Instruct", - "display_name": "Llama 3.1 8b Instruct", + "id": "anthropic/claude-opus-4.6:thinking:max", + "name": "Claude 4.6 Opus Thinking Max", + "display_name": "Claude 4.6 Opus Thinking Max", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 4.998, + "output": 25.007 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4.6:thinking", + "name": "Claude 4.6 Opus Thinking", + "display_name": "Claude 4.6 Opus Thinking", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.0544, - "output": 0.0544 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, @@ -19075,9 +18696,9 @@ "type": "chat" }, { - "id": "baseten/Kimi-K2-Instruct-FP4", - "name": "Kimi K2 0711 Instruct FP4", - "display_name": "Kimi K2 0711 Instruct FP4", + "id": "shisa-ai/shisa-v2-llama3.3-70b", + "name": "Shisa V2 Llama 3.3 70B", + "display_name": "Shisa V2 Llama 3.3 70B", "modalities": { "input": [ "text" @@ -19088,7 +18709,7 @@ }, "limit": { "context": 128000, - "output": 131072 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -19096,18 +18717,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.1, - "output": 2 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "Gryphe/MythoMax-L2-13b", - "name": "MythoMax 13B", - "display_name": "MythoMax 13B", + "id": "shisa-ai/shisa-v2.1-llama3.3-70b", + "name": "Shisa V2.1 Llama 3.3 70B", + "display_name": "Shisa V2.1 Llama 3.3 70B", "modalities": { "input": [ "text" @@ -19117,7 +18738,7 @@ ] }, "limit": { - "context": 4000, + "context": 32768, "output": 4096 }, "tool_call": false, @@ -19126,18 +18747,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1003, - "output": 0.1003 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "x-ai/grok-4-fast:thinking", - "name": "Grok 4 Fast Thinking", - "display_name": "Grok 4 Fast Thinking", + "id": "mistralai/ministral-14b-instruct-2512", + "name": "Ministral 3 14B", + "display_name": "Ministral 3 14B", "modalities": { "input": [ "text", @@ -19148,28 
+18769,27 @@ ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 262144, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "x-ai/grok-4-07-09", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675B", + "display_name": "Mistral Large 3 675B", "modalities": { "input": [ "text", @@ -19180,60 +18800,57 @@ ] }, "limit": { - "context": 256000, - "output": 131072 + "context": 262144, + "output": 256000 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 3, - "output": 15 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "mistralai/Devstral-Small-2505", + "name": "Mistral Devstral Small 2505", + "display_name": "Mistral Devstral Small 2505", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 32768, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-20", - "last_updated": "2025-09-20", + "release_date": "2025-08-02", + "last_updated": "2025-08-02", "cost": { - "input": 0.2, - "output": 0.5 + "input": 
0.060000000000000005, + "output": 0.060000000000000005 }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "mistralai/mistral-saba", + "name": "Mistral Saba", + "display_name": "Mistral Saba", "modalities": { "input": [ "text" @@ -19243,97 +18860,87 @@ ] }, "limit": { - "context": 256000, - "output": 131072 + "context": 32000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.1989, + "output": 0.595 }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "mistralai/mistral-small-creative", + "name": "Mistral Small Creative", + "display_name": "Mistral Small Creative", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 32768, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-reasoning", - "name": "Grok 4.1 Fast Reasoning", - "display_name": "Grok 4.1 Fast Reasoning", + "id": "mistralai/codestral-2508", + "name": "Codestral 2508", + "display_name": "Codestral 2508", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - 
"output": 131072 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.3, + "output": 0.8999999999999999 }, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "Hunyuan MT 7B", - "display_name": "Hunyuan MT 7B", + "id": "mistralai/mixtral-8x22b-instruct-v0.1", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ "text" @@ -19343,8 +18950,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 65536, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19352,53 +18959,51 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 10, - "output": 20 + "input": 0.8999999999999999, + "output": 0.8999999999999999 }, "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "WizardLM-2 8x22B", - "display_name": "WizardLM-2 8x22B", + "id": "mistralai/ministral-14b-2512", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 262144, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "microsoft/MAI-DS-R1-FP8", - "name": "Microsoft 
DeepSeek R1", - "display_name": "Microsoft DeepSeek R1", + "id": "mistralai/mistral-large", + "name": "Mistral Large 2411", + "display_name": "Mistral Large 2411", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" @@ -19406,26 +19011,26 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 256000 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2024-02-26", + "last_updated": "2024-02-26", "cost": { - "input": 0.3, - "output": 0.3 + "input": 2.006, + "output": 6.001 }, "type": "chat" }, { - "id": "cohere/command-r", - "name": "Cohere: Command R", - "display_name": "Cohere: Command R", + "id": "mistralai/ministral-3b-2512", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -19435,8 +19040,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19444,18 +19049,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-03-11", - "last_updated": "2024-03-11", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 0.476, - "output": 1.428 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Cohere: Command R+", - "display_name": "Cohere: Command R+", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -19465,87 +19070,89 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-07-18", + "last_updated": 
"2024-07-18", "cost": { - "input": 2.856, - "output": 14.246 + "input": 0.1003, + "output": 0.1207 }, "type": "chat" }, { - "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24b Instruct", - "display_name": "Mistral Small 3.2 24b Instruct", + "id": "mistralai/mistral-medium-3", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.2, - "output": 0.4 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "nvidia/Llama-3.1-Nemotron-Ultra-253B-v1", - "name": "Nvidia Nemotron Ultra 253B", - "display_name": "Nvidia Nemotron Ultra 253B", + "id": "mistralai/mistral-7b-instruct", + "name": "Mistral 7B Instruct", + "display_name": "Mistral 7B Instruct", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 0.4, - "output": 0.8 + "input": 0.0544, + "output": 0.0544 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "Nvidia Nemotron 3 Nano 30B", - "display_name": "Nvidia Nemotron 3 Nano 30B", + "id": "mistralai/mixtral-8x7b-instruct-v0.1", + "name": "Mixtral 8x7B", + "display_name": "Mixtral 8x7B", "modalities": { "input": [ "text" @@ -19555,8 +19162,8 @@ ] }, "limit": { - 
"context": 256000, - "output": 262144 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19564,18 +19171,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "nvidia/nvidia-nemotron-nano-9b-v2", - "name": "Nvidia Nemotron Nano 9B v2", - "display_name": "Nvidia Nemotron Nano 9B v2", + "id": "mistralai/ministral-8b-2512", + "name": "Ministral 8B", + "display_name": "Ministral 8B", "modalities": { "input": [ "text" @@ -19585,8 +19192,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19594,18 +19201,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", - "name": "Nvidia Nemotron 70b", - "display_name": "Nvidia Nemotron 70b", + "id": "mistralai/devstral-2-123b-instruct-2512", + "name": "Devstral 2 123B", + "display_name": "Devstral 2 123B", "modalities": { "input": [ "text" @@ -19615,8 +19222,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -19624,18 +19231,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.357, - "output": 0.408 + "input": 0.4, + "output": 1.4 }, "type": "chat" }, { - "id": "nvidia/Llama-3.3-Nemotron-Super-49B-v1", - "name": "Nvidia Nemotron Super 49B", - "display_name": "Nvidia Nemotron 
Super 49B", + "id": "mistralai/mistral-tiny", + "name": "Mistral Tiny", + "display_name": "Mistral Tiny", "modalities": { "input": [ "text" @@ -19645,8 +19252,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -19654,18 +19261,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2023-12-11", + "last_updated": "2024-01-01", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.25499999999999995, + "output": 0.25499999999999995 }, "type": "chat" }, { - "id": "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5", - "name": "Nvidia Nemotron Super 49B v1.5", - "display_name": "Nvidia Nemotron Super 49B v1.5", + "id": "mistralai/mistral-medium-3.1", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ "text" @@ -19675,8 +19282,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19684,109 +19291,148 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1:thinking", - "name": "DeepSeek V3.1 Thinking", - "display_name": "DeepSeek V3.1 Thinking", + "id": "qwen/Qwen3.6-35B-A3B:thinking", + "name": "Qwen3.6 35B A3B Thinking", + "display_name": "Qwen3.6 35B A3B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 262144, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, 
+ "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": true, + "release_date": "2026-04-19", + "last_updated": "2026-04-21", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0.29, + "output": 1.74 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text", - "pdf" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 258048, "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus:thinking", - "name": "DeepSeek V3.1 Terminus (Thinking)", - "display_name": "DeepSeek V3.1 Terminus (Thinking)", + "id": "qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 262144, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": 
true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-21", "cost": { - "input": 0.25, - "output": 0.7 + "input": 0.29, + "output": 1.74 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-exp-thinking", - "name": "DeepSeek V3.2 Exp Thinking", - "display_name": "DeepSeek V3.2 Exp Thinking", + "id": "tencent/Hunyuan-MT-7B", + "name": "Hunyuan MT 7B", + "display_name": "Hunyuan MT 7B", "modalities": { "input": [ "text" @@ -19796,28 +19442,27 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 10, + "output": 20 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "google/gemini-flash-1.5", + "name": "Gemini 1.5 Flash", + "display_name": "Gemini 1.5 Flash", "modalities": { "input": [ "text" @@ -19827,8 +19472,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 2000000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -19836,29 +19481,30 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "release_date": "2024-05-14", + "last_updated": "2024-05-14", + "cost": { + "input": 0.0748, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - 
"display_name": "DeepSeek R1 0528", + "id": "google/gemini-3-flash-preview-thinking", + "name": "Gemini 3 Flash Thinking", + "display_name": "Gemini 3 Flash Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 163840 + "context": 1048756, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -19868,147 +19514,122 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 0.4, - "output": 1.7 - }, - "type": "chat" - }, - { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 65536 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-02", - "last_updated": "2025-08-02", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.25, - "output": 0.7 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT 5.1 Codex Max", - "display_name": "GPT 5.1 Codex Max", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash (Preview)", + "display_name": "Gemini 3 Flash (Preview)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048756, + "output": 65536 }, "tool_call": true, "reasoning": { 
"supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 2.5, - "output": 20 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "GPT 5.2 Chat", - "display_name": "GPT 5.2 Chat", + "id": "microsoft/wizardlm-2-8x22b", + "name": "WizardLM-2 8x22B", + "display_name": "WizardLM-2 8x22B", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 16384 + "context": 65536, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 1.75, - "output": 14 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "GPT-4o mini Search Preview", - "display_name": "GPT-4o mini Search Preview", + "id": "microsoft/MAI-DS-R1-FP8", + "name": "Microsoft DeepSeek R1", + "display_name": "Microsoft DeepSeek R1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" @@ -20016,220 +19637,151 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 
8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.088, - "output": 0.35 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/chatgpt-4o-latest", - "name": "ChatGPT 4o", - "display_name": "ChatGPT 4o", + "id": "pamanseau/OpenReasoning-Nemotron-32B", + "name": "OpenReasoning Nemotron 32B", + "display_name": "OpenReasoning Nemotron 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 4.998, - "output": 14.993999999999998 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT 5.2 Pro", - "display_name": "GPT 5.2 Pro", + "id": "Infermatic/MN-12B-Inferor-v0.0", + "name": "Mistral Nemo Inferor 12B", + "display_name": "Mistral Nemo Inferor 12B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + 
"supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 21, - "output": 168 + "input": 0.25499999999999995, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT 5 Mini", - "display_name": "GPT 5 Mini", + "id": "NeverSleep/Lumimaid-v0.2-70B", + "name": "Lumimaid v0.2", + "display_name": "Lumimaid v0.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.25, - "output": 2 + "input": 1, + "output": 1.5 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT 5 Nano", - "display_name": "GPT 5 Nano", + "id": "NeverSleep/Llama-3-Lumimaid-70B-v0.1", + "name": "Lumimaid 70b", + "display_name": "Lumimaid 70b", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - 
"effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.05, - "output": 0.4 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "nex-agi/deepseek-v3.1-nex-n1", + "name": "DeepSeek V3.1 Nex N1", + "display_name": "DeepSeek V3.1 Nex N1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -20237,30 +19789,29 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "release_date": "2025-12-10", + "last_updated": "2025-12-10", "cost": { - "input": 10, - "output": 30 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT 5.2", - "display_name": "GPT 5.2", + "id": "anthracite-org/magnum-v4-72b", + "name": "Magnum v4 72B", + "display_name": "Magnum v4 72B", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -20268,50 +19819,27 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - 
], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.75, - "output": 14 + "input": 2.006, + "output": 2.992 }, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "OpenAI o3-mini (High)", - "display_name": "OpenAI o3-mini (High)", + "id": "anthracite-org/magnum-v2-72b", + "name": "Magnum V2 72B", + "display_name": "Magnum V2 72B", "modalities": { "input": [ "text" @@ -20321,302 +19849,218 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.64, - "output": 2.588 + "input": 2.006, + "output": 2.992 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "deepseek/deepseek-prover-v2-671b", + "name": "DeepSeek Prover v2 671B", + "display_name": "DeepSeek Prover v2 671B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 160000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-04-30", + "last_updated": "2025-04-30", "cost": { - "input": 0.1496, - "output": 0.595 + "input": 
1, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "OpenAI o4-mini Deep Research", - "display_name": "OpenAI o4-mini Deep Research", + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek V3.2 Speciale", + "display_name": "DeepSeek V3.2 Speciale", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163000, + "output": 65536 }, "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "GPT 5.1 Chat", - "display_name": "GPT 5.1 Chat", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.25, - "output": 10 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI 
o4-mini", - "display_name": "OpenAI o4-mini", + "id": "deepseek/deepseek-v3.2:thinking", + "name": "DeepSeek V3.2 Thinking", + "display_name": "DeepSeek V3.2 Thinking", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163000, + "output": 65536 }, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT 5.2 Codex", - "display_name": "GPT 5.2 Codex", + "id": "huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated", + "name": "DeepSeek R1 Llama 70B Abliterated", + "display_name": "DeepSeek R1 Llama 70B Abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "release_date": "2025-01-20", + 
"last_updated": "2025-01-20", "cost": { - "input": 1.75, - "output": 14 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT 5.1 Codex Mini", - "display_name": "GPT 5.1 Codex Mini", + "id": "huihui-ai/Llama-3.1-Nemotron-70B-Instruct-HF-abliterated", + "name": "Nemotron 3.1 70B abliterated", + "display_name": "Nemotron 3.1 70B abliterated", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.25, - "output": 2 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/o1-preview", - "name": "OpenAI o1-preview", - "display_name": "OpenAI o1-preview", + "id": "huihui-ai/Qwen2.5-32B-Instruct-abliterated", + "name": "Qwen 2.5 32B Abliterated", + "display_name": "Qwen 2.5 32B Abliterated", "modalities": { "input": [ "text" @@ -20626,127 +20070,88 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, 
"attachment": false, "open_weights": false, - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "release_date": "2025-01-06", + "last_updated": "2025-01-06", "cost": { - "input": 14.993999999999998, - "output": 59.993 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated", + "name": "DeepSeek R1 Qwen Abliterated", + "display_name": "DeepSeek R1 Qwen Abliterated", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 2.499, - "output": 9.996 + "input": 1.4, + "output": 1.4 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT 5.1", - "display_name": "GPT 5.1", + "id": "huihui-ai/Llama-3.3-70B-Instruct-abliterated", + "name": "Llama 3.3 70B Instruct abliterated", + "display_name": "Llama 3.3 70B Instruct abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": 
true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1.25, - "output": 10 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "OpenAI o1", + "id": "ReadyArt/MS3.2-The-Omega-Directive-24B-Unslop-v2.0", + "name": "Omega Directive 24B Unslop v2.0", + "display_name": "Omega Directive 24B Unslop v2.0", "modalities": { "input": [ "text" @@ -20756,42 +20161,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-17", - "last_updated": "2024-12-17", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 14.993999999999998, - "output": 59.993 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5 Turbo", - "display_name": "GPT-3.5 Turbo", + "id": "ReadyArt/The-Omega-Abomination-L-70B-v1.0", + "name": "The Omega Abomination V1", + "display_name": "The Omega Abomination V1", "modalities": { "input": [ "text" @@ -20801,8 +20191,8 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -20810,18 +20200,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2022-11-30", - "last_updated": "2024-01-01", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.7, + "output": 0.95 }, "type": "chat" }, { - 
"id": "openai/o3-deep-research", - "name": "OpenAI o3 Deep Research", - "display_name": "OpenAI o3 Deep Research", + "id": "featherless-ai/Qwerky-72B", + "name": "Qwerky 72B", + "display_name": "Qwerky 72B", "modalities": { "input": [ "text" @@ -20831,42 +20221,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "OpenAI o3-mini", + "id": "meituan-longcat/LongCat-Flash-Chat-FP8", + "name": "LongCat Flash", + "display_name": "LongCat Flash", "modalities": { "input": [ "text" @@ -20876,42 +20251,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-08-31", + "last_updated": "2025-08-31", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.15, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo-preview", - "name": "GPT-4 Turbo Preview", - "display_name": 
"GPT-4 Turbo Preview", + "id": "failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5", + "name": "Llama 3 70B abliterated", + "display_name": "Llama 3 70B abliterated", "modalities": { "input": [ "text" @@ -20921,8 +20281,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -20930,65 +20290,49 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 9.996, - "output": 30.004999999999995 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/o1-pro", - "name": "OpenAI o1 Pro", - "display_name": "OpenAI o1 Pro", + "id": "meta-llama/llama-4-scout", + "name": "Llama 4 Scout", + "display_name": "Llama 4 Scout", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 328000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 150, - "output": 600 + "input": 0.085, + "output": 0.46 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "meta-llama/llama-3.2-90b-vision-instruct", + "name": "Llama 3.2 Medium", + "display_name": "Llama 3.2 Medium", "modalities": { "input": [ "text" @@ -20998,49 +20342,27 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + 
"output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.9009999999999999, + "output": 0.9009999999999999 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat-latest", - "name": "GPT 5.1 Chat (Latest)", - "display_name": "GPT 5.1 Chat (Latest)", + "id": "meta-llama/llama-4-maverick", + "name": "Llama 4 Maverick", + "display_name": "Llama 4 Maverick", "modalities": { "input": [ "text", @@ -21051,63 +20373,60 @@ ] }, "limit": { - "context": 400000, - "output": 16384 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 1.25, - "output": 10 + "input": 0.18000000000000002, + "output": 0.8 }, "type": "chat" }, { - "id": "openai/gpt-4o-search-preview", - "name": "GPT-4o Search Preview", - "display_name": "GPT-4o Search Preview", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "display_name": "Llama 3.3 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": 
false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 1.47, - "output": 5.88 + "input": 0.05, + "output": 0.23 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT 4.1 Nano", - "display_name": "GPT 4.1 Nano", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Llama 3.2 3b Instruct", + "display_name": "Llama 3.2 3b Instruct", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -21115,8 +20434,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -21124,18 +20443,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.0306, + "output": 0.0493 }, "type": "chat" }, { - "id": "openai/o4-mini-high", - "name": "OpenAI o4-mini high", - "display_name": "OpenAI o4-mini high", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8b Instruct", + "display_name": "Llama 3.1 8b Instruct", "modalities": { "input": [ "text" @@ -21145,42 +20464,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.1, - "output": 4.4 + "input": 
0.0544, + "output": 0.0544 }, "type": "chat" }, { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "VongolaChouko/Starcannon-Unleashed-12B-v1.0", + "name": "Mistral Nemo Starcannon 12b v1", + "display_name": "Mistral Nemo Starcannon 12b v1", "modalities": { "input": [ "text" @@ -21190,42 +20494,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 2, - "output": 8 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "arcee-ai/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ "text" @@ -21235,80 +20524,57 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.04, + "input": 0.045000000000000005, "output": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT 5 Pro", - "display_name": "GPT 5 Pro", + "id": "arcee-ai/trinity-large", + "name": "Trinity Large", + "display_name": "Trinity 
Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 15, - "output": 120 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "openai/gpt-5.1-2025-11-13", - "name": "GPT-5.1 (2025-11-13)", - "display_name": "GPT-5.1 (2025-11-13)", + "id": "meganova-ai/manta-flash-1.0", + "name": "Manta Flash 1.0", + "display_name": "Manta Flash 1.0", "modalities": { "input": [ "text" @@ -21318,80 +20584,57 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-12-20", + "last_updated": "2025-12-20", "cost": { - "input": 1.25, - "output": 10 + "input": 0.02, + "output": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "meganova-ai/manta-pro-1.0", + 
"name": "Manta Pro 1.0", + "display_name": "Manta Pro 1.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-12-20", + "last_updated": "2025-12-20", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0.060000000000000005, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/o3-mini-low", - "name": "OpenAI o3-mini (Low)", - "display_name": "OpenAI o3-mini (Low)", + "id": "meganova-ai/manta-mini-1.0", + "name": "Manta Mini 1.0", + "display_name": "Manta Mini 1.0", "modalities": { "input": [ "text" @@ -21401,96 +20644,57 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-12-20", + "last_updated": "2025-12-20", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.02, + "output": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT 5", - "display_name": "GPT 5", + "id": "LatitudeGames/Wayfarer-Large-70B-Llama-3.3", + "name": "Llama 3.3 70B Wayfarer", + "display_name": "Llama 3.3 70B Wayfarer", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, - "tool_call": true, + 
"tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 1.25, - "output": 10 + "input": 0.700000007, + "output": 0.700000007 }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "display_name": "GPT OSS Safeguard 20B", + "id": "essentialai/rnj-1-instruct", + "name": "RNJ-1 Instruct 8B", + "display_name": "RNJ-1 Instruct 8B", "modalities": { "input": [ "text" @@ -21501,27 +20705,26 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "release_date": "2025-12-13", + "last_updated": "2025-12-13", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/o3-pro-2025-06-10", - "name": "OpenAI o3-pro (2025-06-10)", - "display_name": "OpenAI o3-pro (2025-06-10)", + "id": "abacusai/Dracarys-72B-Instruct", + "name": "Llama 3.1 70B Dracarys 2", + "display_name": "Llama 3.1 70B Dracarys 2", "modalities": { "input": [ "text" @@ -21531,142 +20734,130 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - 
"reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "release_date": "2025-08-02", + "last_updated": "2025-08-02", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "alibaba/qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 991800, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.19, + "output": 1.16 }, "type": "chat" }, { - "id": "openai/gpt-5-chat-latest", - "name": "GPT 5 Chat", - "display_name": "GPT 5 Chat", + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMax M1 80K", + "display_name": "MiniMax M1 80K", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, 
"open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 1.25, - "output": 10 + "input": 0.6052, + "output": 2.4225000000000003 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT 4.1", - "display_name": "GPT 4.1", + "id": "allenai/olmo-3.1-32b-instruct", + "name": "Olmo 3.1 32B Instruct", + "display_name": "Olmo 3.1 32B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 65536, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "release_date": "2026-01-25", + "last_updated": "2026-01-25", "cost": { - "input": 2, - "output": 8 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT 4.1 Mini", - "display_name": "GPT 4.1 Mini", + "id": "allenai/molmo-2-8b", + "name": "Molmo 2 8B", + "display_name": "Molmo 2 8B", "modalities": { "input": [ "text", @@ -21677,8 +20868,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 36864, + "output": 36864 }, "tool_call": false, "reasoning": { @@ -21686,75 +20877,52 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT 5.1 Codex", - "display_name": "GPT 5.1 Codex", + "id": "allenai/olmo-3.1-32b-think", + "name": "Olmo 3.1 32B Think", + "display_name": "Olmo 3.1 32B Think", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - 
"output": 128000 + "context": 65536, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-01-25", + "last_updated": "2026-01-25", "cost": { - "input": 1.25, - "output": 10 + "input": 0.15, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "allenai/olmo-3-32b-think", + "name": "Olmo 3 32B Think", + "display_name": "Olmo 3 32B Think", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -21762,26 +20930,27 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0.3, + "output": 0.44999999999999996 }, "type": "chat" }, { - "id": "VongolaChouko/Starcannon-Unleashed-12B-v1.0", - "name": "Mistral Nemo Starcannon 12b v1", - "display_name": "Mistral Nemo Starcannon 12b v1", + "id": "cognitivecomputations/dolphin-2.9.2-qwen2-72b", + "name": "Dolphin 72b", + "display_name": "Dolphin 72b", "modalities": { "input": [ "text" @@ -21791,8 +20960,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 8192, + "output": 4096 }, "tool_call": false, 
"reasoning": { @@ -21800,18 +20969,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "amazon/nova-lite-v1", - "name": "Amazon Nova Lite 1.0", - "display_name": "Amazon Nova Lite 1.0", + "id": "Steelskull/L3.3-Electra-R1-70b", + "name": "Steelskull Electra R1 70b", + "display_name": "Steelskull Electra R1 70b", "modalities": { "input": [ "text" @@ -21821,8 +20990,8 @@ ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -21830,18 +20999,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.0595, - "output": 0.238 + "input": 0.69989, + "output": 0.69989 }, "type": "chat" }, { - "id": "amazon/nova-pro-v1", - "name": "Amazon Nova Pro 1.0", - "display_name": "Amazon Nova Pro 1.0", + "id": "Steelskull/L3.3-MS-Nevoria-70b", + "name": "Steelskull Nevoria 70b", + "display_name": "Steelskull Nevoria 70b", "modalities": { "input": [ "text" @@ -21851,8 +21020,8 @@ ] }, "limit": { - "context": 300000, - "output": 32000 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -21860,18 +21029,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.7989999999999999, - "output": 3.1959999999999997 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "amazon/nova-2-lite-v1", - "name": "Amazon Nova 2 Lite", - "display_name": "Amazon Nova 2 Lite", + "id": 
"Steelskull/L3.3-Nevoria-R1-70b", + "name": "Steelskull Nevoria R1 70b", + "display_name": "Steelskull Nevoria R1 70b", "modalities": { "input": [ "text" @@ -21881,8 +21050,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65535 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -21890,18 +21059,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.5099999999999999, - "output": 4.25 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "amazon/nova-micro-v1", - "name": "Amazon Nova Micro 1.0", - "display_name": "Amazon Nova Micro 1.0", + "id": "Steelskull/L3.3-MS-Evayale-70B", + "name": "Evayale 70b ", + "display_name": "Evayale 70b ", "modalities": { "input": [ "text" @@ -21911,8 +21080,8 @@ ] }, "limit": { - "context": 128000, - "output": 5120 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -21920,18 +21089,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.0357, - "output": 0.1394 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "Sao10K/L3.3-70B-Euryale-v2.3", - "name": "Llama 3.3 70B Euryale", - "display_name": "Llama 3.3 70B Euryale", + "id": "Steelskull/L3.3-MS-Evalebis-70b", + "name": "MS Evalebis 70b", + "display_name": "MS Evalebis 70b", "modalities": { "input": [ "text" @@ -21941,7 +21110,7 @@ ] }, "limit": { - "context": 20480, + "context": 16384, "output": 16384 }, "tool_call": false, @@ -21959,9 +21128,9 @@ "type": "chat" }, { - "id": "Sao10K/L3.1-70B-Euryale-v2.2", - "name": "Llama 3.1 70B Euryale", - "display_name": "Llama 3.1 70B Euryale", + "id": "Steelskull/L3.3-Cu-Mai-R1-70b", + "name": "Llama 3.3 70B 
Cu Mai", + "display_name": "Llama 3.3 70B Cu Mai", "modalities": { "input": [ "text" @@ -21971,7 +21140,7 @@ ] }, "limit": { - "context": 20480, + "context": 16384, "output": 16384 }, "tool_call": false, @@ -21980,18 +21149,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.306, - "output": 0.357 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "Sao10K/L3.1-70B-Hanami-x1", - "name": "Llama 3.1 70B Hanami", - "display_name": "Llama 3.1 70B Hanami", + "id": "dmind/dmind-1", + "name": "DMind-1", + "display_name": "DMind-1", "modalities": { "input": [ "text" @@ -22001,8 +21170,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -22010,18 +21179,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.3, + "output": 0.6 }, "type": "chat" }, { - "id": "Sao10K/L3-8B-Stheno-v3.2", - "name": "Sao10K Stheno 8b", - "display_name": "Sao10K Stheno 8b", + "id": "dmind/dmind-1-mini", + "name": "DMind-1-Mini", + "display_name": "DMind-1-Mini", "modalities": { "input": [ "text" @@ -22031,7 +21200,7 @@ ] }, "limit": { - "context": 16384, + "context": 32768, "output": 8192 }, "tool_call": false, @@ -22040,18 +21209,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-11-29", - "last_updated": "2024-11-29", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.2, + "output": 0.4 }, "type": "chat" }, { - "id": "LatitudeGames/Wayfarer-Large-70B-Llama-3.3", - "name": "Llama 3.3 70B Wayfarer", - 
"display_name": "Llama 3.3 70B Wayfarer", + "id": "xiaomi/mimo-v2-flash-thinking-original", + "name": "MiMo V2 Flash (Thinking) Original", + "display_name": "MiMo V2 Flash (Thinking) Original", "modalities": { "input": [ "text" @@ -22061,8 +21230,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -22070,18 +21239,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.700000007, - "output": 0.700000007 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "z-ai/glm-4.6:thinking", - "name": "GLM 4.6 Thinking", - "display_name": "GLM 4.6 Thinking", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ "text" @@ -22091,60 +21260,57 @@ ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 256000, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.4, - "output": 1.5 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "z-ai/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "xiaomi/mimo-v2-flash-thinking", + "name": "MiMo V2 Flash (Thinking)", + "display_name": "MiMo V2 Flash (Thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 96000 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - 
"release_date": "2025-11-22", - "last_updated": "2025-11-22", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.6, - "output": 1.7999999999999998 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "xiaomi/mimo-v2-flash-original", + "name": "MiMo V2 Flash Original", + "display_name": "MiMo V2 Flash Original", "modalities": { "input": [ "text" @@ -22154,58 +21320,50 @@ ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 256000, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.4, - "output": 1.5 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "z-ai/glm-4.5v:thinking", - "name": "GLM 4.5V Thinking", - "display_name": "GLM 4.5V Thinking", + "id": "baidu/ernie-4.5-300b-a47b", + "name": "ERNIE 4.5 300B", + "display_name": "ERNIE 4.5 300B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 96000 + "context": 131072, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-22", - "last_updated": "2025-11-22", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.6, - "output": 1.7999999999999998 + "input": 0.35, + "output": 1.15 }, "type": "chat" }, @@ -22241,9 +21399,9 @@ "type": "chat" }, { - "id": "baidu/ernie-4.5-300b-a47b", - "name": "ERNIE 4.5 300B", - "display_name": "ERNIE 4.5 300B", + "id": 
"stepfun-ai/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -22253,27 +21411,28 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 256000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 0.35, - "output": 1.15 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "dmind/dmind-1", - "name": "DMind-1", - "display_name": "DMind-1", + "id": "stepfun-ai/step-3.5-flash:thinking", + "name": "Step 3.5 Flash Thinking", + "display_name": "Step 3.5 Flash Thinking", "modalities": { "input": [ "text" @@ -22283,27 +21442,28 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 256000, + "output": 256000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 0.3, - "output": 0.6 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "dmind/dmind-1-mini", - "name": "DMind-1-Mini", - "display_name": "DMind-1-Mini", + "id": "miromind-ai/mirothinker-v1.5-235b", + "name": "MiroThinker v1.5 235B", + "display_name": "MiroThinker v1.5 235B", "modalities": { "input": [ "text" @@ -22314,7 +21474,7 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 4000 }, "tool_call": false, "reasoning": { @@ -22322,18 +21482,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2026-01-07", + "last_updated": "2026-01-07", "cost": { - "input": 0.2, - "output": 0.4 + "input": 0.3, + "output": 1.2 }, 
"type": "chat" }, { - "id": "Infermatic/MN-12B-Inferor-v0.0", - "name": "Mistral Nemo Inferor 12B", - "display_name": "Mistral Nemo Inferor 12B", + "id": "tngtech/tng-r1t-chimera", + "name": "TNG R1T Chimera", + "display_name": "TNG R1T Chimera", "modalities": { "input": [ "text" @@ -22343,8 +21503,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -22352,18 +21512,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 0.25499999999999995, - "output": 0.49299999999999994 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "meituan-longcat/LongCat-Flash-Chat-FP8", - "name": "LongCat Flash", - "display_name": "LongCat Flash", + "id": "tngtech/DeepSeek-TNG-R1T2-Chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "display_name": "DeepSeek TNG R1T2 Chimera", "modalities": { "input": [ "text" @@ -22374,26 +21534,35 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-31", - "last_updated": "2025-08-31", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.15, - "output": 0.7 + "input": 0.31, + "output": 0.31 }, "type": "chat" - }, + } + ] + }, + "io-net": { + "id": "io-net", + "name": "IO.NET", + "display_name": "IO.NET", + "api": "https://api.intelligence.io.solutions/api/v1", + "doc": "https://io.net/docs/guides/intelligence/io-intelligence", + "models": [ { - "id": "meganova-ai/manta-mini-1.0", - "name": "Manta Mini 1.0", - "display_name": "Manta Mini 1.0", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -22403,27 +21572,43 @@ ] }, "limit": 
{ - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-28", "cost": { - "input": 0.02, - "output": 0.16 + "input": 2, + "output": 8.75, + "cache_read": 1, + "cache_write": 4 }, "type": "chat" }, { - "id": "meganova-ai/manta-pro-1.0", - "name": "Manta Pro 1.0", - "display_name": "Manta Pro 1.0", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -22434,26 +21619,42 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.060000000000000005, - "output": 0.5 + "input": 0.55, + "output": 2.25, + "cache_read": 0.275, + "cache_write": 1.1 }, "type": "chat" }, { - "id": "meganova-ai/manta-flash-1.0", - "name": "Manta Flash 1.0", - "display_name": "Manta Flash 1.0", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct", + "display_name": 
"Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -22463,27 +21664,31 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 32768, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "knowledge": "2024-08", + "release_date": "2024-09-05", + "last_updated": "2024-09-05", "cost": { - "input": 0.02, - "output": 0.16 + "input": 0.39, + "output": 1.9, + "cache_read": 0.195, + "cache_write": 0.78 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "openai/gpt-oss-20b", + "name": "GPT-OSS 20B", + "display_name": "GPT-OSS 20B", "modalities": { "input": [ "text" @@ -22493,70 +21698,75 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 64000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.03, + "output": 0.14, + "cache_read": 0.015, + "cache_write": 0.06 }, "type": "chat" }, { - "id": "minimax/minimax-01", - "name": "MiniMax 01", - "display_name": "MiniMax 01", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000192, - "output": 16384 + "context": 131072, + "output": 4096 }, - 
"tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.1394, - "output": 1.1219999999999999 + "input": 0.04, + "output": 0.4, + "cache_read": 0.02, + "cache_write": 0.08 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -22567,12 +21777,12 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -22581,18 +21791,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "knowledge": "2024-10", + "release_date": "2024-11-15", + "last_updated": "2024-11-15", "cost": { - "input": 0.33, - "output": 1.32 + "input": 0.4, + "output": 1.75, + "cache_read": 0.2, + "cache_write": 0.8 }, "type": "chat" }, { - "id": "minimax/minimax-m2-her", - "name": "MiniMax M2-her", - "display_name": "MiniMax M2-her", + "id": "Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ "text" @@ -22602,27 +21815,31 @@ ] }, "limit": { - "context": 65532, - "output": 2048 + "context": 106000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-24", - 
"last_updated": "2026-01-24", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0.30200000000000005, - "output": 1.2069999999999999 + "input": 0.22, + "output": 0.95, + "cache_read": 0.11, + "cache_write": 0.44 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "mistralai/Devstral-Small-2505", + "name": "Devstral Small 2505", + "display_name": "Devstral Small 2505", "modalities": { "input": [ "text" @@ -22632,163 +21849,100 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-12", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 }, "type": "chat" }, { - "id": "qwen/Qwen3.6-35B-A3B:thinking", - "name": "Qwen3.6 35B A3B Thinking", - "display_name": "Qwen3.6 35B A3B Thinking", + "id": "mistralai/Mistral-Large-Instruct-2411", + "name": "Mistral Large Instruct 2411", + "display_name": "Mistral Large Instruct 2411", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, 
"attachment": false, - "open_weights": true, - "release_date": "2026-04-19", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.29, - "output": 1.74 + "input": 2, + "output": 6, + "cache_read": 1, + "cache_write": 4 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ - "text", - "image", - "video" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 258048, - "output": 65536 - }, - "tool_call": false, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", - "cost": { - "input": 0.6, - "output": 3.6 - }, - "type": "chat" - }, - { - "id": "qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", - "modalities": { - "input": [ - "text", - "image", - "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-21", + "knowledge": "2024-05", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 
0.29, - "output": 1.74 + "input": 0.02, + "output": 0.04, + "cache_read": 0.01, + "cache_write": 0.04 }, "type": "chat" }, { - "id": "unsloth/gemma-3-1b-it", - "name": "Gemma 3 1B IT", - "display_name": "Gemma 3 1B IT", + "id": "mistralai/Magistral-Small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ "text" @@ -22799,61 +21953,68 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "knowledge": "2025-01", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.1003, - "output": 0.1003 + "input": 0.5, + "output": 1.5, + "cache_read": 0.25, + "cache_write": 1 }, "type": "chat" }, { - "id": "unsloth/gemma-3-12b-it", - "name": "Gemma 3 12B IT", - "display_name": "Gemma 3 12B IT", + "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", + "name": "Llama 3.2 90B Vision Instruct", + "display_name": "Llama 3.2 90B Vision Instruct", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 16000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.272, - "output": 0.272 + "input": 0.35, + "output": 0.4, + "cache_read": 0.175, + "cache_write": 0.7 }, "type": "chat" }, { - "id": "unsloth/gemma-3-4b-it", - "name": "Gemma 3 4B IT", - "display_name": "Gemma 3 4B IT", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B 
Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" @@ -22861,57 +22022,65 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.13, + "output": 0.38, + "cache_read": 0.065, + "cache_write": 0.26 }, "type": "chat" }, { - "id": "unsloth/gemma-3-27b-it", - "name": "Gemma 3 27B IT", - "display_name": "Gemma 3 27B IT", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 96000 + "context": 430000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0.2992, - "output": 0.2992 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "GLM Z1 9B 0414", - "display_name": "GLM Z1 9B 0414", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen 3 235B Thinking", + "display_name": "Qwen 3 235B Thinking", "modalities": { "input": [ "text" @@ -22921,27 +22090,43 @@ ] }, "limit": { - "context": 32000, - "output": 8000 + 
"context": 262144, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.11, + "output": 0.6, + "cache_read": 0.055, + "cache_write": 0.22 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "GLM 4 9B 0414", - "display_name": "GLM 4 9B 0414", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen 3 Next 80B Instruct", + "display_name": "Qwen 3 Next 80B Instruct", "modalities": { "input": [ "text" @@ -22951,30 +22136,35 @@ ] }, "limit": { - "context": 32000, - "output": 8000 + "context": 262144, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-10", + "last_updated": "2025-01-10", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.1, + "output": 0.8, + "cache_read": 0.05, + "cache_write": 0.2 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-Rumination-32B-0414", - "name": "GLM Z1 Rumination 32B 0414", - "display_name": "GLM Z1 Rumination 32B 0414", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen 2.5 VL 32B Instruct", + "display_name": "Qwen 2.5 VL 32B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -22982,26 +22172,39 @@ }, "limit": { "context": 32000, - "output": 65536 + 
"output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 }, "type": "chat" - }, + } + ] + }, + "inception": { + "id": "inception", + "name": "Inception", + "display_name": "Inception", + "api": "https://api.inceptionlabs.ai/v1/", + "doc": "https://platform.inceptionlabs.ai/docs", + "models": [ { - "id": "THUDM/GLM-4-32B-0414", - "name": "GLM 4 32B 0414", - "display_name": "GLM 4 32B 0414", + "id": "mercury-edit-2", + "name": "Mercury Edit 2", + "display_name": "Mercury Edit 2", "modalities": { "input": [ "text" @@ -23012,26 +22215,29 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-03-30", + "last_updated": "2026-03-30", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "GLM Z1 32B 0414", - "display_name": "GLM Z1 32B 0414", + "id": "mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ "text" @@ -23042,39 +22248,52 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 50000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + 
"knowledge": "2025-01-01", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" - }, + } + ] + }, + "submodel": { + "id": "submodel", + "name": "submodel", + "display_name": "submodel", + "api": "https://llm.submodel.ai/v1", + "doc": "https://submodel.gitbook.io", + "models": [ { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash (Preview)", - "display_name": "Gemini 3 Flash (Preview)", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 75000, + "output": 163840 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23083,36 +22302,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { "input": 0.5, - "output": 3 + "output": 2.15 }, "type": "chat" }, { - "id": "google/gemini-flash-1.5", - "name": "Gemini 1.5 Flash", - "display_name": "Gemini 1.5 Flash", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -23122,120 +22333,97 @@ ] }, "limit": { - "context": 2000000, - "output": 8192 + "context": 75000, + "output": 163840 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": 
true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.0748, - "output": 0.306 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview-thinking", - "name": "Gemini 3 Flash Thinking", - "display_name": "Gemini 3 Flash Thinking", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 75000, + "output": 163840 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.5, - "output": 3 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.3, - "output": 1.9 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "zai-org/GLM-4.5-Air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -23245,27 +22433,28 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0.1, - "output": 2 + "output": 0.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-original", - "name": "Kimi K2 Thinking Original", - "display_name": "Kimi K2 Thinking Original", + "id": "zai-org/GLM-4.5-FP8", + "name": "GLM 4.5 FP8", + "display_name": "GLM 4.5 FP8", "modalities": { "input": [ "text" @@ -23275,28 +22464,29 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": 
"moonshotai/kimi-k2-instruct-0711", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -23306,58 +22496,71 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.1, - "output": 2 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "moonshotai/Kimi-Dev-72B", - "name": "Kimi Dev 72B", - "display_name": "Kimi Dev 72B", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 262144, "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-turbo-original", - "name": "Kimi K2 Thinking Turbo Original", - "display_name": "Kimi K2 Thinking Turbo Original", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": 
"Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -23367,28 +22570,37 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 1.15, - "output": 8 + "input": 0.2, + "output": 0.3 }, "type": "chat" - }, + } + ] + }, + "requesty": { + "id": "requesty", + "name": "Requesty", + "display_name": "Requesty", + "api": "https://router.requesty.ai/v1", + "doc": "https://requesty.ai/solution/llm-routing/models", + "models": [ { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", "modalities": { "input": [ "text", @@ -23399,32 +22611,52 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 100000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.53, - "output": 2.73 + "input": 0.25, + 
"output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6:thinking", - "name": "Kimi K2.6 Thinking", - "display_name": "Kimi K2.6 Thinking", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ "text", @@ -23435,99 +22667,106 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-21", - "cost": { - "input": 0.53, - "output": 2.73 - }, - "type": "chat" - }, - { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 262144 - }, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.4, - "output": 2 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "openai/gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 400000, + "output": 128000 }, + 
"temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2024-10-01", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5:thinking", - "name": "Kimi K2.5 Thinking", - "display_name": "Kimi K2.5 Thinking", + "id": "openai/gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ "text", @@ -23538,9 +22777,10 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23548,108 +22788,147 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.9 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Tongyi-Zhiwen/QwenLong-L1-32B", - "name": "QwenLong L1 32B", - "display_name": "QwenLong L1 32B", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - 
"output": 40960 - }, - "tool_call": false, + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.13999999999999999, - "output": 0.6 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "nothingiisreal/L3.1-70B-Celeste-V0.1-BF16", - "name": "Llama 3.1 70B Celeste v0.1", - "display_name": "Llama 3.1 70B Celeste v0.1", + "id": "openai/gpt-5-image", + "name": "GPT-5 Image", + "display_name": "GPT-5 Image", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-10-01", + "release_date": "2025-10-14", + "last_updated": "2025-10-14", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0", - "name": "Aion 1.0", - "display_name": "Aion 1.0", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 3.995, - "output": 7.99 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "aion-labs/aion-rp-llama-3.1-8b", - "name": "Llama 3.1 8b (uncensored)", - "display_name": "Llama 3.1 8b (uncensored)", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text" @@ -23659,131 +22938,212 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 16000, + "output": 4000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0-mini", - "name": "Aion 1.0 mini (DeepSeek)", - "display_name": "Aion 1.0 mini (DeepSeek)", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o 
Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.7989999999999999, - "output": 1.394 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", - "name": "Tongyi DeepResearch 30B A3B", - "display_name": "Tongyi DeepResearch 30B A3B", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-Max", + "display_name": "GPT-5.1-Codex-Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.08, - "output": 0.24000000000000002 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMax M1 80K", - 
"display_name": "MiniMax M1 80K", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.6052, - "output": 2.4225000000000003 + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:low", - "name": "Claude 4.6 Opus Thinking Low", - "display_name": "Claude 4.6 Opus Thinking Low", + "id": "openai/o4-mini", + "name": "o4 Mini", + "display_name": "o4 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 100000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23793,56 +23153,46 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "medium", "effort_options": [ "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends 
adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 4.998, - "output": 25.007 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude 4.6 Opus", - "display_name": "Claude 4.6 Opus", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23852,56 +23202,53 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 4.998, - "output": 25.007 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6:thinking", - "name": "Claude Sonnet 4.6 Thinking", - "display_name": "Claude Sonnet 4.6 Thinking", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23911,57 +23258,87 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "medium", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 2.992, - "output": 14.993999999999998 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:max", - "name": "Claude 4.6 Opus Thinking Max", - "display_name": "Claude 4.6 Opus Thinking Max", + "id": "openai/gpt-5-chat", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -23971,42 +23348,39 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 4.998, - "output": 25.007 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:medium", - "name": "Claude 4.6 Opus Thinking Medium", - "display_name": "Claude 4.6 Opus Thinking Medium", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3-Codex", + "display_name": "GPT-5.3-Codex", "modalities": { "input": [ "text", @@ -24018,9 +23392,10 @@ ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -24030,42 +23405,198 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "audio", + "image", + "video" + ], + "output": [ + "text", + "audio", + "image" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", "high" ], 
- "interleaved": true, - "summaries": true, - "visibility": "summary", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-3-7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ "Anthropic uses thinking budget tokens" ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-01", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 4.998, - "output": 25.007 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 62000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-01", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -24076,10 +23607,47 @@ "text" ] }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { "context": 
1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -24117,15 +23685,35 @@ "release_date": "2026-02-17", "last_updated": "2026-02-17", "cost": { - "input": 2.992, - "output": 14.993999999999998 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking", - "name": "Claude 4.6 Opus Thinking", - "display_name": "Claude 4.6 Opus Thinking", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", @@ -24140,15 +23728,16 @@ "context": 1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "mixed", "budget": { "min": 1024, @@ -24173,168 +23762,295 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-05-31", "release_date": "2026-02-05", "last_updated": "2026-02-05", "cost": { - "input": 4.998, - "output": 25.007 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "abacusai/Dracarys-72B-Instruct", - "name": "Llama 3.1 70B Dracarys 2", - "display_name": "Llama 3.1 70B Dracarys 2", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 
4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-02", - "last_updated": "2025-08-02", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0", - "name": "EVA Llama 3.33 70B", - "display_name": "EVA Llama 3.33 70B", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 2.006, - "output": 2.006 + "input": 2, + "output": 12, + "cache_read": 0.2, + "cache_write": 4.5 }, "type": 
"chat" }, { - "id": "EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2", - "name": "EVA-Qwen2.5-72B-v0.2", - "display_name": "EVA-Qwen2.5-72B-v0.2", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.7989999999999999, - "output": 0.7989999999999999 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 1 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1", - "name": "EVA-LLaMA-3.33-70B-v0.1", - "display_name": "EVA-LLaMA-3.33-70B-v0.1", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + 
"budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 2.006, - "output": 2.006 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.55 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-Qwen2.5-32B-v0.2", - "name": "EVA-Qwen2.5-32B-v0.2", - "display_name": "EVA-Qwen2.5-32B-v0.2", + "id": "xai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 256000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "knowledge": "2025-01", + "release_date": "2025-09-09", + "last_updated": "2025-09-09", "cost": { - "input": 0.7989999999999999, - "output": 0.7989999999999999 + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 3 }, "type": "chat" }, { - "id": "huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated", - "name": "DeepSeek R1 Qwen Abliterated", - "display_name": "DeepSeek R1 Qwen Abliterated", + "id": "xai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ "text" @@ -24344,299 +24060,485 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 2000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": 
{ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-01", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 1.4, - "output": 1.4 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05, + "cache_write": 0.2 + }, + "type": "chat" }, { - "id": "huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated", - "name": "DeepSeek R1 Llama 70B Abliterated", - "display_name": "DeepSeek R1 Llama 70B Abliterated", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.7, - "output": 0.7 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "huihui-ai/Llama-3.3-70B-Instruct-abliterated", - "name": "Llama 3.3 70B Instruct abliterated", - "display_name": "Llama 3.3 70B Instruct abliterated", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - 
"context": 16384, - "output": 16384 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.7, - "output": 0.7 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "huihui-ai/Qwen2.5-32B-Instruct-abliterated", - "name": "Qwen 2.5 32B Abliterated", - "display_name": "Qwen 2.5 32B Abliterated", + "id": "openai/gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 272000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-06", - "last_updated": "2025-01-06", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.7, - "output": 0.7 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "huihui-ai/Llama-3.1-Nemotron-70B-Instruct-HF-abliterated", - "name": "Nemotron 3.1 70B abliterated", - "display_name": "Nemotron 3.1 70B abliterated", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 
16384 + "context": 1050000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.7, - "output": 0.7 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash-thinking-original", - "name": "MiMo V2 Flash (Thinking) Original", - "display_name": "MiMo V2 Flash (Thinking) Original", + "id": "openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.102, - "output": 0.306 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - 
"id": "xiaomi/mimo-v2-flash-thinking", - "name": "MiMo V2 Flash (Thinking)", - "display_name": "MiMo V2 Flash (Thinking)", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.102, - "output": 0.306 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", + "id": "anthropic/claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.102, - "output": 0.306 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": 
"xiaomi/mimo-v2-flash-original", - "name": "MiMo V2 Flash Original", - "display_name": "MiMo V2 Flash Original", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.102, - "output": 0.306 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "tngtech/DeepSeek-TNG-R1T2-Chimera", - "name": "DeepSeek TNG R1T2 Chimera", - "display_name": "DeepSeek TNG R1T2 Chimera", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-01", + "release_date": "2025-03-20", + 
"last_updated": "2025-06-05", "cost": { - "input": 0.31, - "output": 0.31 + "input": 1.25, + "output": 10, + "cache_read": 0.31, + "cache_write": 2.375, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" - }, + } + ] + }, + "zai": { + "id": "zai", + "name": "Z.AI", + "display_name": "Z.AI", + "api": "https://api.z.ai/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "models": [ { - "id": "tngtech/tng-r1t-chimera", - "name": "TNG R1T Chimera", - "display_name": "TNG R1T Chimera", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -24646,57 +24548,90 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-11-26", - "last_updated": "2025-11-26", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "inflatebot/MN-12B-Mag-Mell-R1", - "name": "Mag Mell R1", - "display_name": "Mag Mell R1", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.2, + "output": 4, + "cache_read": 0.24, + "cache_write": 0 }, "type": "chat" }, { - "id": "failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5", - "name": "Llama 3 70B abliterated", - "display_name": "Llama 3 70B abliterated", + "id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ "text" @@ -24706,104 +24641,80 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "abacus": { - "id": "abacus", - "name": "Abacus", - "display_name": "Abacus", - "api": "https://routellm.abacus.ai/v1", - "doc": "https://abacus.ai/help/api", - "models": [ + }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - 
"context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.25, - "output": 10 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -24812,33 +24723,31 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 5, - "output": 25 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, 
"limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -24848,45 +24757,37 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.6, - "output": 3 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -24899,98 +24800,69 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 98304 }, 
"temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 3, - "output": 15 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -24998,50 +24870,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + 
"open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2, - "output": 12 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat Latest", - "display_name": "GPT-5.3 Chat Latest", + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -25049,35 +24905,44 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 1.75, - "output": 14 + "input": 1.2, + "output": 4, + "cache_read": 0.24, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -25088,37 +24953,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + 
"thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.5, - "output": 3 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "llama-3.3-70b-versatile", - "name": "Llama 3.3 70B Versatile", - "display_name": "Llama 3.3 70B Versatile", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -25128,97 +24987,99 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.59, - "output": 0.79 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ 
- "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.25, - "output": 2 + "input": 0.3, + "output": 0.9 }, "type": "chat" - }, + } + ] + }, + "zai-coding-plan": { + "id": "zai-coding-plan", + "name": "Z.AI Coding Plan", + "display_name": "Z.AI Coding Plan", + "api": "https://api.z.ai/api/coding/paas/v4", + "doc": "https://docs.z.ai/devpack/overview", + "models": [ { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25227,100 +25088,68 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.05, - "output": 0.4 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - 
"id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.75, - "output": 14 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -25328,7 +25157,7 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -25336,36 +25165,44 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - 
"last_updated": "2025-09-29", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 3, - "output": 15 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -25376,139 +25213,145 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.25, - "output": 10 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, 
+ "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "deepinfra": { + "id": "deepinfra", + "name": "Deep Infra", + "display_name": "Deep Infra", + "doc": "https://deepinfra.com/models", + "models": [ { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 64000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 1.75, - "output": 14 + "input": 0.5, + "output": 2.15, + "cache_read": 0.35 }, "type": "chat" }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": 
"deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163840, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25517,65 +25360,62 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "knowledge": "2024-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 20, - "output": 40 + "input": 0.26, + "output": 0.38, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "moonshotai/Kimi-K2-Thinking", + 
"name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -25586,7 +25426,7 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -25606,33 +25446,35 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-11-06", + "last_updated": "2025-11-07", "cost": { - "input": 1.2, - "output": 6 + "input": 0.47, + "output": 2 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25641,47 +25483,45 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.75, + "output": 3.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ 
"text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25690,108 +25530,73 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.75, - "output": 14 + "input": 0.5, + "output": 2.8 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + 
"attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.4, + "output": 2, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat Latest", - "display_name": "GPT-5.2 Chat Latest", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -25799,36 +25604,38 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14 + "input": 0.03, + "output": 0.14 }, "type": "chat" }, { - "id": "gpt-5.3-codex-xhigh", - "name": "GPT-5.3 Codex XHigh", - "display_name": "GPT-5.3 Codex XHigh", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25836,132 +25643,100 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - 
"attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14 + "input": 0.05, + "output": 0.24 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "zai-org/GLM-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, 
+ "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.25, - "output": 10 + "input": 0.43, + "output": 1.75, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -25971,10 +25746,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25983,43 +25758,39 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.06, + "output": 0.4 }, "type": "chat" }, { - "id": "grok-4-0709", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 202752, "output": 16384 }, "temperature": true, @@ -26028,53 +25799,78 @@ "supported": true, "default": true 
}, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 3, - "output": 15 + "input": 0.8, + "output": 2.56, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "route-llm", - "name": "Route LLM", - "display_name": "Route LLM", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 202752, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 3, - "output": 15 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "qwen-2.5-coder-32b", - "name": "Qwen 2.5 Coder 32B", - "display_name": "Qwen 2.5 Coder 32B", + "id": "zai-org/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -26084,28 +25880,42 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + 
"default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-11-11", - "last_updated": "2024-11-11", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.79, - "output": 0.79 + "input": 0.43, + "output": 1.74, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "zai-org/GLM-4.6V", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", @@ -26116,10 +25926,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26128,44 +25938,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.25, - "output": 10 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "anthropic/claude-3-7-sonnet-latest", + "name": "Claude Sonnet 3.7 (Latest)", + "display_name": "Claude Sonnet 3.7 
(Latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -26173,28 +25972,50 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-10-31", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 15, - "output": 75 + "input": 3.3, + "output": 16.5, + "cache_read": 0.33 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "anthropic/claude-4-opus", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -26205,155 +26026,121 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-03-31", + "release_date": "2025-06-12", + "last_updated": 
"2025-06-12", "cost": { - "input": 2.5, - "output": 15 + "input": 16.5, + "output": 82.5 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat Latest", - "display_name": "GPT-5.1 Chat Latest", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.25, - "output": 10 + "input": 0.02, + "output": 0.05 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "meta-llama/Llama-3.1-70B-Instruct-Turbo", + "name": "Llama 3.1 70B Turbo", + "display_name": "Llama 3.1 70B Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1, - "output": 5 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": 
"meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama 4 Scout 17B", + "display_name": "Llama 4 Scout 17B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 10000000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 3, - "output": 15 + "input": 0.08, + "output": 0.3 }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo Preview", - "display_name": "Kimi K2 Turbo Preview", + "id": "meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama 3.1 70B", + "display_name": "Llama 3.1 70B", "modalities": { "input": [ "text" @@ -26363,89 +26150,87 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 131072, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, - "output": 8 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "meta-llama/Llama-3.1-8B-Instruct-Turbo", + "name": "Llama 3.1 8B Turbo", + "display_name": "Llama 3.1 8B Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": 
false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.02, + "output": 0.03 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "type": "chat" + }, + { + "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", + "name": "Llama 3.3 70B Turbo", + "display_name": "Llama 3.3 70B Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 16384 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 5, - "output": 25 + "input": 0.1, + "output": 0.32 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 Nano", - "display_name": "GPT-4.1 Nano", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B FP8", + "display_name": "Llama 4 Maverick 17B FP8", "modalities": { "input": [ "text", @@ -26456,98 +26241,84 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1000000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + 
"open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 3, - "output": 15 + "input": 0.28, + "output": 1.2 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26556,46 +26327,44 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - 
"mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2, - "output": 8 + "input": 0.27, + "output": 0.95, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "MiniMaxAI/MiniMax-M2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26604,129 +26373,129 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1.25, - "output": 10 + "input": 0.254, + "output": 1.02 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": 
"Claude Opus 4", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 15, - "output": 75 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen 3.5 397B A17B", + "display_name": "Qwen 3.5 397B A17B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-01", + "last_updated": "2026-04-20", "cost": { - "input": 2, - "output": 8 + "input": 0.54, + "output": 3.4 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3 Coder 480B A35B 
Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { "input": 0.4, "output": 1.6 @@ -26734,130 +26503,145 @@ "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "Qwen/Qwen3.5-35B-A3B", + "name": "Qwen 3.5 35B A3B", + "display_name": "Qwen 3.5 35B A3B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 81920 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-01", + "last_updated": "2026-04-20", "cost": { - "input": 1.25, - "output": 10 + "input": 0.2, + "output": 0.95 }, "type": "chat" }, { - "id": "gpt-4o-2024-11-20", - 
"name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ "text", "image", - "audio" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0.2, + "output": 1 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "deepseek-ai/DeepSeek-V4-Flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 16384 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.2, - "output": 0.5 + "input": 
0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -26867,8 +26651,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -26876,31 +26660,45 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.55, - "output": 1.66 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "google/gemma-4-26B-A4B-it", + "name": "Gemma 4 26B", + "display_name": "Gemma 4 26B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -26908,41 +26706,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2024-11-28", - "last_updated": "2024-11-28", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.07, + "output": 0.34 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": 
"Qwen3 235B A22B Instruct", - "display_name": "Qwen3 235B A22B Instruct", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 256000, "output": 8192 }, "temperature": true, @@ -26953,18 +26741,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { "input": 0.13, - "output": 0.6 + "output": 0.38 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "xiaomi/mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -26974,8 +26762,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -26996,21 +26784,42 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.09, - "output": 0.29 + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "Qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "xiaomi/mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" @@ -27018,7 +26827,7 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 16384 }, "temperature": true, "tool_call": 
true, @@ -27026,93 +26835,123 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.29, - "output": 1.2 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + }, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" - }, + } + ] + }, + "clarifai": { + "id": "clarifai", + "name": "Clarifai", + "display_name": "Clarifai", + "api": "https://api.clarifai.com/v2/ext/openai/v1", + "doc": "https://docs.clarifai.com/compute/inference/", + "models": [ { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen 2.5 72B Instruct", - "display_name": "Qwen 2.5 72B Instruct", + "id": "deepseek-ai/deepseek-ocr/models/DeepSeek-OCR", + "name": "DeepSeek OCR", + "display_name": "DeepSeek OCR", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "release_date": "2025-10-20", + "last_updated": "2026-02-25", "cost": { - "input": 0.11, - "output": 0.38 + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "clarifai/main/models/mm-poly-8b", + "name": "MM Poly 8B", + "display_name": "MM Poly 8B", 
"modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "attachment": true, + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2026-02-25", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.658, + "output": 1.11 }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "openai/chat-completion/models/gpt-oss-120b-high-throughput", + "name": "GPT OSS 120B High Throughput", + "display_name": "GPT OSS 120B High Throughput", "modalities": { "input": [ "text" @@ -27122,8 +26961,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -27131,31 +26970,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-08-05", + "last_updated": "2026-02-25", "cost": { - "input": 1, - "output": 3.2 + "input": 0.09, + "output": 0.36 }, "type": "chat" }, { - "id": "zai-org/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "openai/chat-completion/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -27165,8 
+26993,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -27174,20 +27002,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-08-05", + "last_updated": "2025-12-12", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.045, + "output": 0.18 }, "type": "chat" }, { - "id": "zai-org/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "arcee_ai/AFM/models/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ "text" @@ -27197,64 +27030,64 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2026-02-25", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.045, + "output": 0.15 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", - "name": "Llama 3.1 405B Instruct Turbo", - "display_name": "Llama 3.1 405B Instruct Turbo", + "id": "mistralai/completion/models/Ministral-3-14B-Reasoning-2512", + "name": "Ministral 3 14B Reasoning 2512", + "display_name": "Ministral 3 14B Reasoning 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - 
"attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-12", "cost": { - "input": 3.5, - "output": 3.5 + "input": 2.5, + "output": 1.7 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "mistralai/completion/models/Ministral-3-3B-Reasoning-2512", + "name": "Ministral 3 3B Reasoning 2512", + "display_name": "Ministral 3 3B Reasoning 2512", "modalities": { "input": [ "text", @@ -27265,29 +27098,29 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-12", + "last_updated": "2026-02-25", "cost": { - "input": 0.14, - "output": 0.59 + "input": 1.039, + "output": 0.54825 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "qwen/qwenCoder/models/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -27297,8 +27130,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -27307,18 +27140,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2026-02-12", "cost": { - "input": 0.02, - "output": 0.05 + "input": 0.11458, + 
"output": 0.74812 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -27328,40 +27162,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-07-30", + "last_updated": "2026-02-25", "cost": { - "input": 3, - "output": 7 + "input": 0.3, + "output": 0.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -27371,8 +27193,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -27382,23 +27204,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2025-07-31", + "last_updated": "2026-02-25", "cost": { - "input": 0.27, - "output": 0.4 + "input": 0.36, + "output": 1.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - 
"name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "minimaxai/chat-completion/models/MiniMax-M2_5-high-throughput", + "name": "MiniMax-M2.5 High Throughput", + "display_name": "MiniMax-M2.5 High Throughput", "modalities": { "input": [ "text" @@ -27408,8 +27236,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -27419,18 +27247,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-25", "cost": { - "input": 0.27, - "output": 1 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "moonshotai/chat-completion/models/Kimi-K2_6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -27441,8 +27269,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -27452,32 +27280,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.08, - "output": 0.44 + "input": 0.95, + "output": 4 }, "type": "chat" } ] }, - "perplexity-agent": { - "id": "perplexity-agent", - "name": "Perplexity Agent", - "display_name": "Perplexity Agent", - "api": "https://api.perplexity.ai/v1", - "doc": "https://docs.perplexity.ai/docs/agent-api/models", + "moark": { + "id": "moark", + "name": "Moark", + "display_name": "Moark", + "api": "https://moark.com/v1", + "doc": 
"https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", "models": [ { - "id": "perplexity/sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -27487,75 +27322,99 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.25, - "output": 2.5, - "cache_read": 0.0625 + "input": 2.1, + "output": 8.4 }, "type": "chat" }, { - "id": "xai/grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 3.5, + 
"output": 14 }, "type": "chat" - }, + } + ] + }, + "frogbot": { + "id": "frogbot", + "name": "FrogBot", + "display_name": "FrogBot", + "api": "https://app.frogbot.ai/api/v1", + "doc": "https://docs.frogbot.ai", + "models": [ { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super 120B", - "display_name": "Nemotron 3 Super 120B", + "id": "kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -27563,21 +27422,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "open_weights": false, + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.25, - "output": 2.5 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -27589,10 +27459,10 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27600,41 +27470,26 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": 
"hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", @@ -27645,165 +27500,123 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - 
}, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-11", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": 
"2025-06-05", "cost": { "input": 1.25, "output": 10, - "cache_read": 0.125 + "cache_read": 0.31 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", "modalities": { "input": [ "text", @@ -27814,130 +27627,94 @@ ] }, "limit": { - "context": 1050000, + "context": 2000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-11", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "deepseek-v4-pro", + "name": "DeepSeek v4 Pro", + "display_name": "DeepSeek v4 Pro", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - 
"high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2026-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 1.74, + "output": 3.48, + "cache_read": 0.14 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "gpt-5-5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -27947,119 +27724,84 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, 
{ - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 2000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-11", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "grok-code-fast-1", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -28069,53 +27811,69 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - 
"off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + }, + "type": "chat" + }, + { + "id": "minimax-m2-7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 192000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-09", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0.3, - "output": 2.5, - "cache_read": 0.03 + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -28128,20 +27886,18 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1 + "input": 0.07, + "output": 0.2 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", + "id": "claude-sonnet-4-6", "name": "Claude Sonnet 4.6", "display_name": "Claude Sonnet 4.6", 
"modalities": { @@ -28198,89 +27954,63 @@ "cost": { "input": 3, "output": 15, - "cache_read": 0.3 + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "kimi-k2-6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gpt-5-3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -28288,25 +28018,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2026-01-31", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -28321,7 +28067,7 @@ "context": 200000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -28331,44 
+28077,43 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "high", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh" ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { "input": 5, "output": 25, - "cache_read": 0.5 + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen-3-6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ "text", @@ -28380,7 +28125,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -28389,79 +28134,92 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-04-02", + "last_updated": "2026-04-03", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3 + "input": 0.5, + "output": 3, + "cache_read": 0.1 }, "type": "chat" - } - ] - }, - "siliconflow": { - "id": 
"siliconflow", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.cn/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ + }, { - "id": "Kwaipilot/KAT-Dev", - "name": "Kwaipilot/KAT-Dev", - "display_name": "Kwaipilot/KAT-Dev", + "id": "gpt-5-4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-27", - "last_updated": "2026-01-16", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { "input": 0.2, - "output": 0.6 + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen/Qwen3.5-397B-A17B", - "display_name": "Qwen/Qwen3.5-397B-A17B", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -28473,87 +28231,109 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], 
"summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.29, - "output": 1.74 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-35B-A3B", - "name": "Qwen/Qwen3.5-35B-A3B", - "display_name": "Qwen/Qwen3.5-35B-A3B", + "id": "gpt-5-4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-25", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.23, - "output": 1.86 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-122B-A10B", - "name": "Qwen/Qwen3.5-122B-A10B", - "display_name": "Qwen/Qwen3.5-122B-A10B", + "id": "gemini-2.5-flash", 
+ "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -28565,180 +28345,179 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-07-17", + "last_updated": "2025-07-17", "cost": { - "input": 0.29, - "output": 2.32 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-9B", - "name": "Qwen/Qwen3.5-9B", - "display_name": "Qwen/Qwen3.5-9B", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated 
compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.22, - "output": 1.74 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-27B", - "name": "Qwen/Qwen3.5-27B", - "display_name": "Qwen/Qwen3.5-27B", + "id": "zai-glm-5-1", + "name": "Z.AI GLM-5.1", + "display_name": "Z.AI GLM-5.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 198000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-25", - "last_updated": "2026-02-25", + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-02-22", "cost": { - "input": 0.26, - "output": 2.09 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-4B", - "name": "Qwen/Qwen3.5-4B", - "display_name": "Qwen/Qwen3.5-4B", + "id": "minimax-m2-5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 192000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-01-15", + "last_updated": "2025-02-22", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-35B-A3B", - "name": "Qwen/Qwen3.6-35B-A3B", - "display_name": "Qwen/Qwen3.6-35B-A3B", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -28748,61 +28527,69 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.23, - "output": 1.86 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", + "id": "gemini-3-1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2026-01", + "release_date": "2026-02-18", + "last_updated": "2026-02-18", "cost": { - "input": 0.59, - "output": 0.59 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" - }, + } + ] + }, + "cohere": { + "id": "cohere", + "name": "Cohere", + "display_name": "Cohere", + "doc": "https://docs.cohere.com/docs/models", + "models": [ { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "id": "c4ai-aya-expanse-32b", + "name": "Aya Expanse 32B", + "display_name": "Aya Expanse 32B", "modalities": { "input": [ "text" @@ -28812,59 +28599,57 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", - "cost": { - "input": 0.25, - "output": 1 - } + "open_weights": true, + "release_date": "2024-10-24", + "last_updated": "2024-10-24", + "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Instruct", - "name": "Qwen/Qwen3-VL-8B-Instruct", - "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "id": "command-a-reasoning-08-2025", + "name": "Command A Reasoning", + "display_name": "Command A Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "attachment": false, + 
"open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.18, - "output": 0.68 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Instruct", - "name": "Qwen/Qwen3-VL-32B-Instruct", - "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "id": "c4ai-aya-vision-8b", + "name": "Aya Vision 8B", + "display_name": "Aya Vision 8B", "modalities": { "input": [ "text", @@ -28875,28 +28660,24 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 16000, + "output": 4000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", - "cost": { - "input": 0.2, - "output": 0.6 - }, + "open_weights": true, + "release_date": "2025-03-04", + "last_updated": "2025-05-14", "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "id": "command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -28906,40 +28687,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.29, - "output": 1 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": 
"Qwen/Qwen2.5-14B-Instruct", - "name": "Qwen/Qwen2.5-14B-Instruct", - "display_name": "Qwen/Qwen2.5-14B-Instruct", + "id": "command-a-03-2025", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ "text" @@ -28949,8 +28719,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -28958,19 +28728,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "c4ai-aya-expanse-8b", + "name": "Aya Expanse 8B", + "display_name": "Aya Expanse 8B", "modalities": { "input": [ "text" @@ -28980,28 +28751,57 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8000, + "output": 4000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2024-10-24", + "last_updated": "2024-10-24", + "type": "chat" + }, + { + "id": "command-a-vision-07-2025", + "name": "Command A Vision", + "display_name": "Command A Vision", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 
0.3, - "output": 1.5 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "id": "command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" @@ -29011,40 +28811,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.14, - "output": 0.57 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "command-r7b-12-2024", + "name": "Command R7B", + "display_name": "Command R7B", "modalities": { "input": [ "text" @@ -29054,71 +28843,57 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.0375, + "output": 0.15 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - 
"display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "id": "c4ai-aya-vision-32b", + "name": "Aya Vision 32B", + "display_name": "Aya Vision 32B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 16000, + "output": 4000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.4 - }, + "open_weights": true, + "release_date": "2025-03-04", + "last_updated": "2025-05-14", "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "id": "command-r7b-arabic-02-2025", + "name": "Command R7B Arabic", + "display_name": "Command R7B Arabic", "modalities": { "input": [ "text" @@ -29128,40 +28903,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0.0375, + "output": 0.15 }, "type": "chat" }, { - "id": 
"Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "command-a-translate-08-2025", + "name": "Command A Translate", + "display_name": "Command A Translate", "modalities": { "input": [ "text" @@ -29171,8 +28935,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -29180,19 +28944,29 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-19", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.18, - "output": 0.18 + "input": 2.5, + "output": 10 }, "type": "chat" - }, + } + ] + }, + "wandb": { + "id": "wandb", + "name": "Weights & Biases", + "display_name": "Weights & Biases", + "api": "https://api.inference.wandb.ai/v1", + "doc": "https://docs.wandb.ai/guides/integrations/inference/", + "models": [ { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -29202,8 +28976,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 161000, + "output": 161000 }, "temperature": true, "tool_call": true, @@ -29211,35 +28985,37 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2026-03-12", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.55, + "output": 1.65 }, "type": "chat" }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": 
{ "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -29252,20 +29028,20 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-03-12", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.5, + "output": 2.85 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "id": "openai/gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -29276,27 +29052,32 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2025-08-05", + "last_updated": "2026-03-12", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "id": "openai/gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -29307,26 +29088,32 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + 
"reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-11-25", + "release_date": "2025-08-05", + "last_updated": "2026-03-12", "cost": { - "input": 0.07, - "output": 0.28 - } + "input": 0.15, + "output": 0.6 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "zai-org/GLM-5-FP8", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -29336,39 +29123,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-03-12", "cost": { - "input": 0.14, - "output": 0.57 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "id": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-FP8", + "name": "NVIDIA Nemotron 3 Super 120B", + "display_name": "NVIDIA Nemotron 3 Super 120B", "modalities": { "input": [ "text" @@ -29378,8 +29154,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -29387,19 +29163,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-03-11", + "last_updated": "2026-03-12", "cost": { - "input": 0.09, - 
"output": 0.6 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "id": "microsoft/Phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -29409,28 +29185,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2026-03-12", "cost": { - "input": 0.09, - "output": 0.3 + "input": 0.08, + "output": 0.35 }, "type": "chat" }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": "OpenPipe/Qwen3-14B-Instruct", + "name": "OpenPipe Qwen3 14B Instruct", + "display_name": "OpenPipe Qwen3 14B Instruct", "modalities": { "input": [ "text" @@ -29440,39 +29218,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2026-03-12", "cost": { - "input": 0.06, - "output": 0.06 + "input": 0.05, + "output": 0.22 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": 
"Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -29482,28 +29249,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.22, + "output": 0.22 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Thinking", - "name": "Qwen/Qwen3-VL-8B-Thinking", - "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", @@ -29514,8 +29283,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 64000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -29523,31 +29292,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2026-03-12", "cost": { - "input": 0.18, - "output": 2 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "id": 
"meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama 3.1 70B", + "display_name": "Llama 3.1 70B", "modalities": { "input": [ "text" @@ -29557,28 +29316,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -29588,14 +29347,84 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2026-03-12", + "cost": { + "input": 0.71, + "output": 0.71 + }, + "type": "chat" + }, + { + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-03-12", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + 
"display_name": "Qwen3-235B-A22B-Thinking-2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, "extra_capabilities": { "reasoning": { "supported": true, @@ -29608,19 +29437,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-06", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2026-03-12", "cost": { - "input": 0.15, - "output": 0.58 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -29630,28 +29460,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2026-03-12", "cost": { - "input": 0.29, - "output": 1 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -29661,8 +29491,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": 
true, @@ -29670,18 +29500,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-11-11", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2026-03-12", "cost": { - "input": 0.18, - "output": 0.18 - } + "input": 0.1, + "output": 0.1 + }, + "type": "chat" }, { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -29691,8 +29523,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -29700,19 +29532,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0.05, - "output": 0.05 + "input": 1, + "output": 1.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -29722,8 +29555,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -29742,20 +29575,31 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.45, - "output": 3.5 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" - }, + 
} + ] + }, + "gmicloud": { + "id": "gmicloud", + "name": "GMI Cloud", + "display_name": "GMI Cloud", + "api": "https://api.gmi-serving.com/v1", + "doc": "https://docs.gmicloud.ai/inference-engine/api-reference/llm-api-reference", + "models": [ { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "id": "deepseek-ai/DeepSeek-V4-Flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -29765,8 +29609,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048575, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -29786,31 +29630,32 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.09, - "output": 0.3 + "input": 0.112, + "output": 0.224, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Thinking", - "name": "Qwen/Qwen3-VL-32B-Thinking", - "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -29829,20 +29674,22 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.2, - "output": 1.5 + "input": 1.392, + "output": 2.784, + "cache_read": 0.116 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": 
"Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text" @@ -29852,28 +29699,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.855, + "output": 3.6, + "cache_read": 0.144 }, "type": "chat" }, { - "id": "stepfun-ai/Step-3.5-Flash", - "name": "stepfun-ai/Step-3.5-Flash", - "display_name": "stepfun-ai/Step-3.5-Flash", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -29883,8 +29744,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -29892,20 +29753,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.98, + "output": 3.08, + "cache_read": 0.182 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5V", - "name": "zai-org/GLM-4.5V", - "display_name": 
"zai-org/GLM-4.5V", + "id": "zai-org/GLM-5-FP8", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -29915,28 +29788,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.14, - "output": 0.86 + "input": 0.6, + "output": 1.92, + "cache_read": 0.12 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "zai-org/GLM-4.6", - "display_name": "zai-org/GLM-4.6", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text" @@ -29946,66 +29832,117 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 409600, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.5, - "output": 1.9 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "zai-org/GLM-4.6V", - "display_name": "zai-org/GLM-4.6V", + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 409600, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-07", - "last_updated": "2025-12-07", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.3, - "output": 0.9 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "zai-org/GLM-4.5-Air", - "display_name": "zai-org/GLM-4.5-Air", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text" @@ -30015,59 +29952,111 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 409600, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.14, - "output": 0.86 + "input": 4.5, + "output": 22.5, + "cache_read": 0.45 }, "type": "chat" - }, + } + ] + }, + "ambient": { + "id": "ambient", + "name": "Ambient", + "display_name": "Ambient", + "api": "https://api.ambient.xyz/v1", + "doc": "https://ambient.xyz", + "models": [ { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.95, + "output": 4, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -30077,28 +30066,51 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": 
true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.07, - "output": 0.28 + "input": 1.4, + "output": 4.4, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "routing-run": { + "id": "routing-run", + "name": "routing.run", + "display_name": "routing.run", + "api": "https://api.routing.run/v1", + "doc": "https://docs.routing.run/api-reference/models", + "models": [ { - "id": "inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", + "id": "route/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -30108,8 +30120,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -30123,40 +30135,55 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.4928, + "output": 0.7392 }, "type": "chat" }, { - "id": "ascend-tribe/pangu-pro-moe", - "name": "ascend-tribe/pangu-pro-moe", - "display_name": "ascend-tribe/pangu-pro-moe", + "id": "route/qwen3.5-9b", + "name": "Qwen3.5 9B", + "display_name": "Qwen3.5 9B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2026-01-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-03-10", + "last_updated": "2026-03-10", "cost": { "input": 0.2, "output": 0.6 @@ -30164,84 +30191,69 @@ "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "route/qwen3.5-9b-chat", + "name": "Qwen3.5 9B Chat", + "display_name": "Qwen3.5 9B Chat", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": 
"2026-03-10", + "last_updated": "2026-03-10", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-4.7", - "name": "Pro/zai-org/GLM-4.7", - "display_name": "Pro/zai-org/GLM-4.7", + "id": "route/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -30259,19 +30271,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.462, + "output": 2.42, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-5.1", - "name": "Pro/zai-org/GLM-5.1", - "display_name": "Pro/zai-org/GLM-5.1", + "id": "route/minimax-m2.7-highspeed", + "name": "MiniMax M2.7 Highspeed", + "display_name": "MiniMax M2.7 Highspeed", "modalities": { "input": [ "text" @@ -30281,8 +30295,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30303,19 +30317,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.4, - "output": 4.4, - "cache_write": 0 + "input": 0.33, + "output": 1.32, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-5", - "name": "Pro/zai-org/GLM-5", - "display_name": "Pro/zai-org/GLM-5", + "id": "route/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -30325,8 
+30340,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -30346,19 +30361,21 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { "input": 1, - "output": 3.2 + "output": 3, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-V3", - "name": "Pro/deepseek-ai/DeepSeek-V3", - "display_name": "Pro/deepseek-ai/DeepSeek-V3", + "id": "route/step-3.5-flash-full", + "name": "Step 3.5 Flash Full", + "display_name": "Step 3.5 Flash Full", "modalities": { "input": [ "text" @@ -30368,39 +30385,45 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.25, - "output": 1 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-R1", - "name": "Pro/deepseek-ai/DeepSeek-R1", - "display_name": "Pro/deepseek-ai/DeepSeek-R1", + "id": "route/qwen3.6-27b", + "name": "Qwen3.6 27B", + "display_name": "Qwen3.6 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -30419,33 +30442,35 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": 
true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.5, - "output": 2.18 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-V3.2", - "name": "Pro/deepseek-ai/DeepSeek-V3.2", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.2", + "id": "route/kimi-k2.5-highspeed", + "name": "Kimi K2.5 Highspeed", + "display_name": "Kimi K2.5 Highspeed", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -30453,55 +30478,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", - "cost": { - "input": 0.27, - "output": 0.42 - }, - "type": "chat" - }, - { - "id": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.27, - "output": 1 + "input": 0.6468, + "output": 3.388, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2-Thinking", - "name": "Pro/moonshotai/Kimi-K2-Thinking", - "display_name": "Pro/moonshotai/Kimi-K2-Thinking", 
+ "id": "route/deepseek-v4-pro-precision", + "name": "DeepSeek V4 Pro Precision", + "display_name": "DeepSeek V4 Pro Precision", "modalities": { "input": [ "text" @@ -30511,8 +30512,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30532,31 +30533,32 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.55, - "output": 2.5 + "input": 0.7392, + "output": 1.1088, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2.6", - "name": "Pro/moonshotai/Kimi-K2.6", - "display_name": "Pro/moonshotai/Kimi-K2.6", + "id": "route/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30577,19 +30579,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2-Instruct-0905", - "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", - "display_name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "id": "route/glm-5-highspeed", + "name": "GLM 5 Highspeed", + "display_name": "GLM 5 Highspeed", "modalities": { "input": [ "text" @@ -30599,40 +30602,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": 
false, - "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", - "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" - }, - { - "id": "Pro/moonshotai/Kimi-K2.5", - "name": "Pro/moonshotai/Kimi-K2.5", - "display_name": "Pro/moonshotai/Kimi-K2.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262000, - "output": 262000 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -30653,18 +30624,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.45, - "output": 2.25 + "input": 1.1088, + "output": 3.542, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/MiniMaxAI/MiniMax-M2.5", - "name": "Pro/MiniMaxAI/MiniMax-M2.5", - "display_name": "Pro/MiniMaxAI/MiniMax-M2.5", + "id": "route/mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ "text" @@ -30674,13 +30647,14 @@ ] }, "limit": { - "context": 192000, - "output": 131000 + "context": 1000000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -30694,19 +30668,37 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.3, - "output": 1.22 + "input": 0.45, + "output": 1.35, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": 
"Pro/MiniMaxAI/MiniMax-M2.1", - "name": "Pro/MiniMaxAI/MiniMax-M2.1", - "display_name": "Pro/MiniMaxAI/MiniMax-M2.1", + "id": "route/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -30716,13 +30708,14 @@ ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -30730,19 +30723,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.193, + "output": 1.238, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "PaddlePaddle/PaddleOCR-VL", - "name": "PaddlePaddle/PaddleOCR-VL", - "display_name": "PaddlePaddle/PaddleOCR-VL", + "id": "route/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", @@ -30753,90 +30748,115 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-10-16", - "last_updated": "2025-10-16", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "PaddlePaddle/PaddleOCR-VL-1.5", - "name": "PaddlePaddle/PaddleOCR-VL-1.5", - "display_name": "PaddlePaddle/PaddleOCR-VL-1.5", + "id": "route/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", - "image" + 
"image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0, - "output": 0 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-OCR", - "name": "deepseek-ai/DeepSeek-OCR", - "display_name": "deepseek-ai/DeepSeek-OCR", + "id": "route/glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2025-10-20", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0, - "output": 0 - } + "input": 1.32, + "output": 4.4, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "route/glm-5.1-full", + "name": "GLM 5.1 Full", + "display_name": "GLM 5.1 Full", "modalities": { "input": [ "text" @@ -30846,8 +30866,8 @@ ] }, 
"limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -30855,20 +30875,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.27, - "output": 1 + "input": 1.2, + "output": 3.5, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "deepseek-ai/DeepSeek-V3.2", - "display_name": "deepseek-ai/DeepSeek-V3.2", + "id": "route/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ "text" @@ -30878,8 +30911,8 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30889,34 +30922,43 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.27, - "output": 0.42 + "input": 0.33, + "output": 1.32, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "route/mistral-small-2503", + "name": "Mistral Small 2503", + "display_name": "Mistral Small 2503", "modalities": { "input": [ - "text" + "text", 
+ "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -30924,20 +30966,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "deepseek-ai/DeepSeek-R1", - "display_name": "deepseek-ai/DeepSeek-R1", + "id": "route/mimo-v2.5-pro-precision", + "name": "MiMo V2.5 Pro Precision", + "display_name": "MiMo V2.5 Pro Precision", "modalities": { "input": [ "text" @@ -30947,8 +30990,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30968,19 +31011,37 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.5, - "output": 2.18 + "input": 0.45, + "output": 1.35, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "route/stepfun-3.5-flash", + "name": "StepFun 3.5 Flash", + "display_name": "StepFun 3.5 Flash", "modalities": { "input": [ "text" @@ -30990,8 +31051,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 
262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -31000,50 +31061,54 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "deepseek-ai/DeepSeek-V3", - "display_name": "deepseek-ai/DeepSeek-V3", + "id": "route/mistral-large-3", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0.25, - "output": 1 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "route/step-3.5-flash-2603", + "name": "Step 3.5 Flash 2603", + "display_name": "Step 3.5 Flash 2603", "modalities": { "input": [ "text" @@ -31053,90 +31118,128 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + 
"last_updated": "2026-04-02", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "route/mistral-medium-2505", + "name": "Mistral Medium 2505", + "display_name": "Mistral Medium 2505", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2025-11-25", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", + "id": "route/mimo-v2.5", + "name": "MiMo V2.5", + "display_name": "MiMo V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + 
"context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + }, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "route/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -31146,28 +31249,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "route/glm-5.1-precision", + "name": "GLM 5.1 Precision", + "display_name": "GLM 5.1 Precision", "modalities": { "input": [ "text" @@ -31177,90 +31294,136 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": 
"2025-04-18", - "last_updated": "2025-11-25", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.086, - "output": 0.086 + "input": 1.2, + "output": 3.5, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "route/kimi-k2.6-precision", + "name": "Kimi K2.6 Precision", + "display_name": "Kimi K2.6 Precision", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.086, - "output": 0.086 + "input": 0.6468, + "output": 3.388, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "moonshotai/Kimi-K2-Instruct-0905", - "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "id": "route/kimi-k2.6-full", + "name": "Kimi K2.6 Full", + "display_name": "Kimi K2.6 Full", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.4, - "output": 2 + "input": 0.462, + "output": 2.42, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "moonshotai/Kimi-K2-Thinking", - "display_name": "moonshotai/Kimi-K2-Thinking", + "id": "route/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -31270,8 +31433,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -31279,31 +31442,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.55, - "output": 2.5 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "route/minimax-m2.5-highspeed", + "name": "MiniMax M2.5 Highspeed", + "display_name": "MiniMax M2.5 Highspeed", "modalities": { "input": [ "text" @@ -31313,13 +31467,14 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + 
"default": true }, "extra_capabilities": { "reasoning": { @@ -31327,19 +31482,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.21, - "output": 0.57 + "input": 0.193, + "output": 1.238, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", + "id": "route/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -31349,19 +31506,43 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 1.32, + "output": 4.4, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "id": "route/glm-5.1-fp16", + "name": "GLM 5.1 FP16", + "display_name": "GLM 5.1 FP16", "modalities": { "input": [ "text" @@ -31371,19 +31552,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 202752 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 1.2, + "output": 3.5, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "inclusionAI/Ring-1T", - "name": "inclusionAI/Ring-1T", - "display_name": "inclusionAI/Ring-1T", + "id": "route/glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -31393,9 +31597,10 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 202752 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -31403,15 +31608,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0.792, + "output": 2.53, + "cache_read": 0.2, + "cache_write": 0 + }, "type": "chat" }, { - "id": "inclusionAI/Ling-1T", - "name": "inclusionAI/Ling-1T", - "display_name": "inclusionAI/Ling-1T", + "id": "route/deepseek-v4-flash-full", + "name": "DeepSeek V4 Flash Full", + "display_name": "DeepSeek V4 Flash Full", "modalities": { "input": [ "text" @@ -31421,107 +31642,98 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 
0.4928, + "output": 0.7392, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "Qwen/Qwen-Image-Edit-2509", - "name": "Qwen/Qwen-Image-Edit-2509", - "display_name": "Qwen/Qwen-Image-Edit-2509", + "id": "route/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ + "text", "image", - "text" + "video" ], "output": [ - "image" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Qwen/Qwen-Image-Edit", - "name": "Qwen/Qwen-Image-Edit", - "display_name": "Qwen/Qwen-Image-Edit", - "modalities": { - "input": [ - "image", "text" - ], - "output": [ - "image" ] }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Qwen/Qwen-Image", - "name": "Qwen/Qwen-Image", - "display_name": "Qwen/Qwen-Image", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] + "limit": { + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } - }, - { - "id": "Wan-AI/Wan2.2-I2V-A14B", - "name": "Wan-AI/Wan2.2-I2V-A14B", - "display_name": "Wan-AI/Wan2.2-I2V-A14B", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "video" - ] + "supported": true, + "default": true }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Wan-AI/Wan2.2-T2V-A14B", - "name": "Wan-AI/Wan2.2-T2V-A14B", - "display_name": "Wan-AI/Wan2.2-T2V-A14B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "video" - ] + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.462, + "output": 2.42, + 
"cache_read": 0.16 + }, + "type": "chat" + } + ] + }, + "the-grid-ai": { + "id": "the-grid-ai", + "name": "The Grid AI", + "display_name": "The Grid AI", + "api": "https://api.thegrid.ai/v1", + "doc": "https://thegrid.ai/docs", + "models": [ { - "id": "zai-org/GLM-4.5", - "name": "zai-org/GLM-4.5", - "display_name": "zai-org/GLM-4.5", + "id": "text-max", + "name": "Text Max", + "display_name": "Text Max", "modalities": { "input": [ "text" @@ -31531,19 +31743,25 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-24", + "last_updated": "2026-03-24", "type": "chat" }, { - "id": "stepfun-ai/step3", - "name": "stepfun-ai/step3", - "display_name": "stepfun-ai/step3", + "id": "text-prime", + "name": "Text Prime", + "display_name": "Text Prime", "modalities": { "input": [ "text" @@ -31553,36 +31771,25 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 30000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "type": "chat" }, { - "id": "TeleAI/TeleSpeechASR", - "name": "TeleAI/TeleSpeechASR", - "display_name": "TeleAI/TeleSpeechASR", - "modalities": { - "input": [ - "audio" - ], - "output": [ - "text" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "THUDM/GLM-4.1V-9B-Thinking", - "name": "THUDM/GLM-4.1V-9B-Thinking", - "display_name": "THUDM/GLM-4.1V-9B-Thinking", + "id": "text-standard", + "name": "Text Standard", + "display_name": "Text Standard", "modalities": { "input": [ "text" @@ -31592,20 +31799,34 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 
128000, + "output": 16000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "type": "chat" - }, + } + ] + }, + "fastrouter": { + "id": "fastrouter", + "name": "FastRouter", + "display_name": "FastRouter", + "api": "https://go.fastrouter.ai/api/v1", + "doc": "https://fastrouter.ai/models", + "models": [ { - "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "id": "deepseek-ai/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -31616,19 +31837,34 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-01-23", + "last_updated": "2025-01-23", + "cost": { + "input": 0.03, + "output": 0.14 + }, "type": "chat" }, { - "id": "moonshotai/Kimi-Dev-72B", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", + "id": "moonshotai/kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -31639,18 +31875,28 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "cost": { + "input": 0.55, + "output": 2.2 + }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMaxAI/MiniMax-M1-80k", - "display_name": 
"MiniMaxAI/MiniMax-M1-80k", + "id": "z-ai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -31660,19 +31906,40 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0.95, + "output": 3.15 }, "type": "chat" }, { - "id": "Tongyi-Zhiwen/QwenLong-L1-32B", - "name": "Tongyi-Zhiwen/QwenLong-L1-32B", - "display_name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -31683,308 +31950,586 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.05, + "output": 0.2 + }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "display_name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + 
"reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen/Qwen3-30B-A3B", - "display_name": "Qwen/Qwen3-30B-A3B", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-8B", - "name": "Qwen/Qwen3-Reranker-8B", - "display_name": "Qwen/Qwen3-Reranker-8B", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + 
"context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "type": "rerank" - }, - { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen/Qwen3-Embedding-8B", - "display_name": "Qwen/Qwen3-Embedding-8B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "embedding" - ] + "supported": true, + "default": true }, - "limit": { - "context": 8192, - "output": 2048 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - "tool_call": false, - "reasoning": { - "supported": false + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.15, + "output": 0.6 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-4B", - "name": "Qwen/Qwen3-Reranker-4B", - "display_name": "Qwen/Qwen3-Reranker-4B", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "rerank" + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-4B", - "name": "Qwen/Qwen3-Embedding-4B", - "display_name": "Qwen/Qwen3-Embedding-4B", + 
"id": "x-ai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 256000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 15 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-0.6B", - "name": "Qwen/Qwen3-Reranker-0.6B", - "display_name": "Qwen/Qwen3-Reranker-0.6B", + "id": "qwen/qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 66536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-0.6B", - "name": "Qwen/Qwen3-Embedding-0.6B", - "display_name": "Qwen/Qwen3-Embedding-0.6B", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": 
"embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen/Qwen3-235B-A22B", - "display_name": "Qwen/Qwen3-235B-A22B", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.0375 + }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + 
"context": 1047576, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, "type": "chat" }, { - "id": "Qwen/QVQ-72B-Preview", - "name": "Qwen/QVQ-72B-Preview", - "display_name": "Qwen/QVQ-72B-Preview", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, "type": "chat" - }, + } + ] + }, + "tencent-coding-plan": { + "id": "tencent-coding-plan", + "name": "Tencent Coding Plan (China)", + 
"display_name": "Tencent Coding Plan (China)", + "api": "https://api.lkeap.cloud.tencent.com/coding/v3", + "doc": "https://cloud.tencent.com/document/product/1772/128947", + "models": [ { - "id": "deepseek-ai/DeepSeek-V2.5", - "name": "deepseek-ai/DeepSeek-V2.5", - "display_name": "deepseek-ai/DeepSeek-V2.5", + "id": "kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "hunyuan-turbos", + "name": "Hunyuan-TurboS", + "display_name": "Hunyuan-TurboS", "modalities": { "input": [ "text" @@ -31995,86 +32540,185 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, "type": "chat" }, { - "id": "fnlp/MOSS-TTSD-v0.5", - "name": "fnlp/MOSS-TTSD-v0.5", - "display_name": "fnlp/MOSS-TTSD-v0.5", + "id": "hunyuan-2.0-thinking", + "name": "Tencent HY 2.0 Think", + "display_name": "Tencent HY 2.0 Think", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + 
"tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "FunAudioLLM/CosyVoice2-0.5B", - "name": "FunAudioLLM/CosyVoice2-0.5B", - "display_name": "FunAudioLLM/CosyVoice2-0.5B", + "id": "hunyuan-2.0-instruct", + "name": "Tencent HY 2.0 Instruct", + "display_name": "Tencent HY 2.0 Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "FunAudioLLM/SenseVoiceSmall", - "name": "FunAudioLLM/SenseVoiceSmall", - "display_name": "FunAudioLLM/SenseVoiceSmall", + "id": "tc-code-latest", + "name": "Auto", + "display_name": "Auto", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "IndexTeam/IndexTTS-2", - "name": "IndexTeam/IndexTTS-2", - "display_name": "IndexTeam/IndexTTS-2", + "id": "minimax-m2.5", + 
"name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 204800, + "output": 32768 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "BAAI/bge-m3", - "name": "BAAI/bge-m3", - "display_name": "BAAI/bge-m3", + "id": "hunyuan-t1", + "name": "Hunyuan-T1", + "display_name": "Hunyuan-T1", "modalities": { "input": [ "text" @@ -32085,100 +32729,224 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "BAAI/bge-reranker-v2-m3", - "name": "BAAI/bge-reranker-v2-m3", - "display_name": "BAAI/bge-reranker-v2-m3", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 202752, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "rerank" - }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + } + ] + }, + "cortecs": { + "id": "cortecs", + "name": "Cortecs", + "display_name": "Cortecs", + "api": "https://api.cortecs.ai/v1", + "doc": "https://api.cortecs.ai/v1/models", + "models": [ { - "id": "netease-youdao/bce-embedding-base_v1", - "name": "netease-youdao/bce-embedding-base_v1", - "display_name": "netease-youdao/bce-embedding-base_v1", + "id": "minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 196000, + "output": 196000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.34, + "output": 1.34 + }, + "type": "chat" }, { - "id": "netease-youdao/bce-reranker-base_v1", - "name": "netease-youdao/bce-reranker-base_v1", - "display_name": "netease-youdao/bce-reranker-base_v1", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "score" + "text" ] }, "limit": { - 
"context": 8192, - "output": 2048 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0.55, + "output": 2.76 + }, + "type": "chat" }, { - "id": "Kwai-Kolors/Kolors", - "name": "Kwai-Kolors/Kolors", - "display_name": "Kwai-Kolors/Kolors", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 200000, + "output": 200000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1.09, + "output": 5.43 + }, + "type": "chat" }, { - "id": "Qwen/Qwen2-VL-72B-Instruct", - "name": "Qwen/Qwen2-VL-72B-Instruct", - "display_name": "Qwen/Qwen2-VL-72B-Instruct", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -32188,62 +32956,131 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": 
true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-14", + "last_updated": "2026-04-14", + "cost": { + "input": 1.31, + "output": 4.1, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-7B-Instruct", - "name": "Qwen/Qwen2.5-Coder-7B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "id": "claude-opus4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", + "cost": { + "input": 5.6, + "output": 27.99, + "cache_read": 0.56, + "cache_write": 6.99 + }, + "type": "chat" }, { - "id": "internlm/internlm2_5-7b-chat", - "name": "internlm/internlm2_5-7b-chat", - "display_name": "internlm/internlm2_5-7b-chat", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65535 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + 
"release_date": "2025-03-20", + "last_updated": "2025-06-17", + "cost": { + "input": 1.654, + "output": 11.024 }, "type": "chat" }, { - "id": "Qwen/Qwen2-7B-Instruct", - "name": "Qwen/Qwen2-7B-Instruct", - "display_name": "Qwen/Qwen2-7B-Instruct", + "id": "minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -32253,19 +33090,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 400000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.39, + "output": 1.57 }, "type": "chat" }, { - "id": "THUDM/glm-4-9b-chat", - "name": "THUDM/glm-4-9b-chat", - "display_name": "THUDM/glm-4-9b-chat", + "id": "kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -32275,19 +33134,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-07-11", + "last_updated": "2025-09-05", + "cost": { + "input": 0.551, + "output": 2.646 + }, "type": "chat" }, { - "id": "BAAI/bge-large-en-v1.5", - "name": "BAAI/bge-large-en-v1.5", - "display_name": "BAAI/bge-large-en-v1.5", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -32297,19 +33166,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 164000, + 
"output": 164000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "cost": { + "input": 0.585, + "output": 2.307 + }, + "type": "chat" }, { - "id": "BAAI/bge-large-zh-v1.5", - "name": "BAAI/bge-large-zh-v1.5", - "display_name": "BAAI/bge-large-zh-v1.5", + "id": "deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -32319,19 +33210,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "cost": { + "input": 0.551, + "output": 1.654 + }, + "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-32B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-32B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "id": "codestral-2508", + "name": "Codestral 2508", + "display_name": "Codestral 2508", "modalities": { "input": [ "text" @@ -32341,19 +33242,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0.3, + "output": 0.9, + "cache_read": 0.03 + }, "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-14B-Instruct", - "name": 
"LoRA/Qwen/Qwen2.5-14B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "id": "qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -32363,19 +33275,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 33000, + "output": 33000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", + "cost": { + "input": 0.062, + "output": 0.231 + }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -32385,20 +33307,35 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 163840, + "output": 163840 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.266, + "output": 0.444 + }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "id": "hermes-4-70b", + "name": "Hermes 4 70B", + "display_name": "Hermes 4 70B", "modalities": { "input": [ "text" @@ -32408,18 +33345,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": 
true, + "knowledge": "2023-12", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "cost": { + "input": 0.116, + "output": 0.358 + }, + "type": "chat" }, { - "id": "Pro/BAAI/bge-m3", - "name": "Pro/BAAI/bge-m3", - "display_name": "Pro/BAAI/bge-m3", + "id": "devstral-2512", + "name": "Devstral 2 2512", + "display_name": "Devstral 2 2512", "modalities": { "input": [ "text" @@ -32429,63 +33378,97 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "id": "claude-opus4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 200000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5.98, + "output": 29.89 }, "type": "chat" }, { - "id": "Pro/BAAI/bge-reranker-v2-m3", - "name": "Pro/BAAI/bge-reranker-v2-m3", - "display_name": "Pro/BAAI/bge-reranker-v2-m3", + "id": "glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "rerank" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "cost": { + "input": 0.22, + "output": 1.34 + }, + "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-72B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-72B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -32495,19 +33478,40 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 196608, + "output": 196608 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.32, + "output": 1.18 }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2-7B-Instruct", - "name": "Pro/Qwen/Qwen2-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2-7B-Instruct", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -32517,63 +33521,107 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 203000, + "output": 203000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", + 
"cost": { + "input": 0.09, + "output": 0.53 }, "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-7B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-7B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "id": "devstral-small-2512", + "name": "Devstral Small 2 2512", + "display_name": "Devstral Small 2 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "Pro/THUDM/glm-4-9b-chat", - "name": "Pro/THUDM/glm-4-9b-chat", - "display_name": "Pro/THUDM/glm-4-9b-chat", + "id": "gpt-4.1", + "name": "GPT 4.1", + "display_name": "GPT 4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2.354, + "output": 9.417 + }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-Rumination-32B-0414", - "name": "THUDM/GLM-Z1-Rumination-32B-0414", - "display_name": "THUDM/GLM-Z1-Rumination-32B-0414", + "id": "glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -32584,189 +33632,381 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + 
"continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "cost": { + "input": 0.67, + "output": 2.46 + }, "type": "chat" }, { - "id": "stabilityai/stable-diffusion-xl-base-1.0", - "name": "stabilityai/stable-diffusion-xl-base-1.0", - "display_name": "stabilityai/stable-diffusion-xl-base-1.0", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next 80B", + "display_name": "Qwen3 Coder Next 80B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 256000, + "output": 65536 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-04", + "last_updated": "2026-02-04", + "cost": { + "input": 0.158, + "output": 0.84 + }, + "type": "chat" }, { - "id": "black-forest-labs/FLUX.1-schnell", - "name": "black-forest-labs/FLUX.1-schnell", - "display_name": "black-forest-labs/FLUX.1-schnell", + "id": "minimax-m2.7", + "name": "MiniMax-m2.7", + "display_name": "MiniMax-m2.7", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 202752, + "output": 196072 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.47, + "output": 1.4 + }, + "type": "chat" }, { - "id": "black-forest-labs/FLUX.1-dev", - "name": "black-forest-labs/FLUX.1-dev", - 
"display_name": "black-forest-labs/FLUX.1-dev", + "id": "intellect-3", + "name": "INTELLECT 3", + "display_name": "INTELLECT 3", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Pro/black-forest-labs/FLUX.1-schnell", - "name": "Pro/black-forest-labs/FLUX.1-schnell", - "display_name": "Pro/black-forest-labs/FLUX.1-schnell", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] + "limit": { + "context": 128000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", + "cost": { + "input": 0.219, + "output": 1.202 + }, + "type": "chat" }, { - "id": "stabilityai/stable-diffusion-3-5-large", - "name": "stabilityai/stable-diffusion-3-5-large", - "display_name": "stabilityai/stable-diffusion-3-5-large", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 16384, + "output": 16384 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "cost": { + "input": 0.099, + "output": 0.33 + }, + "type": "chat" }, { - "id": "fishaudio/fish-speech-1.4", - "name": "fishaudio/fish-speech-1.4", - "display_name": "fishaudio/fish-speech-1.4", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 
Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "cost": { + "input": 0.164, + "output": 1.311 + }, + "type": "chat" }, { - "id": "RVC-Boss/GPT-SoVITS", - "name": "RVC-Boss/GPT-SoVITS", - "display_name": "RVC-Boss/GPT-SoVITS", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 0.656, + "output": 2.731 + }, + "type": "chat" }, { - "id": "fishaudio/fish-speech-1.5", - "name": "fishaudio/fish-speech-1.5", - "display_name": "fishaudio/fish-speech-1.5", + "id": "nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super 120B A12B", + "display_name": "Nemotron 3 Super 120B A12B", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + 
"context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", + "cost": { + "input": 0.266, + "output": 0.799 + }, + "type": "chat" }, { - "id": "black-forest-labs/FLUX.1-pro", - "name": "black-forest-labs/FLUX.1-pro", - "display_name": "black-forest-labs/FLUX.1-pro", + "id": "nova-pro-v1", + "name": "Nova Pro 1.0", + "display_name": "Nova Pro 1.0", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 300000, + "output": 5000 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "cost": { + "input": 1.016, + "output": 4.061 + }, + "type": "chat" }, { - "id": "LoRA/black-forest-labs/FLUX.1-dev", - "name": "LoRA/black-forest-labs/FLUX.1-dev", - "display_name": "LoRA/black-forest-labs/FLUX.1-dev", + "id": "claude-4-5-sonnet", + "name": "Claude 4.5 Sonnet", + "display_name": "Claude 4.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 200000, + "output": 200000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3.259, + "output": 16.296 + }, + "type": "chat" }, { - "id": "SeedLLM/Seed-Rice-7B", - "name": "SeedLLM/Seed-Rice-7B", - "display_name": "SeedLLM/Seed-Rice-7B", + "id": "qwen3-235b-a22b-instruct-2507", + 
"name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -32776,39 +34016,43 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0.062, + "output": 0.408 }, "type": "chat" - } - ] - }, - "submodel": { - "id": "submodel", - "name": "submodel", - "display_name": "submodel", - "api": "https://llm.submodel.ai/v1", - "doc": "https://submodel.gitbook.io", - "models": [ + }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -32816,50 +34060,55 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 0.3 + "input": 3.307, + "output": 16.536 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "claude-opus4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + 
"context": 1000000, + "output": 1000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.2, - "output": 0.8 + "input": 5.98, + "output": 29.89 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -32869,40 +34118,29 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "knowledge": "2025-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.441, + "output": 1.984 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "llama-3.1-405b-instruct", + "name": "Llama 3.1 405B Instruct", + "display_name": "Llama 3.1 405B Instruct", "modalities": { "input": [ "text" @@ -32912,8 +34150,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -32922,18 +34160,19 @@ }, "attachment": false, "open_weights": 
true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-FP8", - "name": "GLM 4.5 FP8", - "display_name": "GLM 4.5 FP8", + "id": "glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -32943,8 +34182,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 198000, + "output": 198000 }, "temperature": true, "tool_call": true, @@ -32952,20 +34191,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.45, + "output": 2.23 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "gpt-oss-120b", + "name": "GPT Oss 120b", + "display_name": "GPT Oss 120b", "modalities": { "input": [ "text" @@ -32975,29 +34226,34 @@ ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": true, + "knowledge": "2024-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0, + "output": 0 }, "type": "chat" 
}, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "mixtral-8x7B-instruct-v0.1", + "name": "Mixtral 8x7B Instruct v0.1", + "display_name": "Mixtral 8x7B Instruct v0.1", "modalities": { "input": [ "text" @@ -33007,28 +34263,30 @@ ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.438, + "output": 0.68 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -33038,8 +34296,8 @@ ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -33059,30 +34317,31 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.5, - "output": 2.15 + "input": 1.08, + "output": 3.44 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -33092,43 +34351,43 @@ }, "extra_capabilities": { 
"reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0.81, + "output": 3.54, + "cache_read": 0.2 }, "type": "chat" - } - ] - }, - "minimax-coding-plan": { - "id": "minimax-coding-plan", - "name": "MiniMax Coding Plan (minimax.io)", - "display_name": "MiniMax Coding Plan (minimax.io)", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/coding-plan/intro", - "models": [ + }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "claude-4-6-sonnet", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 1000000, + "output": 1000000 }, "temperature": true, "tool_call": true, @@ -33136,64 +34395,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 3.59, + "output": 17.92 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "mistral-large-2512", + "name": "Mistral Large 3 2512", + "display_name": "Mistral Large 3 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + 
"output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.5, + "output": 1.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -33203,8 +34453,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -33225,20 +34475,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.553, + "output": 3.106, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "qwen3.5-122b-a10b", + "name": "Qwen3.5 122B A10B", + "display_name": "Qwen3.5 122B A10B", "modalities": { "input": [ "text" @@ -33248,8 +34498,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -33270,20 +34520,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2026-01", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - 
"input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.444, + "output": 3.106 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text" @@ -33293,8 +34542,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 250000, + "output": 250000 }, "temperature": true, "tool_call": true, @@ -33304,23 +34553,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2026-01", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -33330,8 +34586,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -33341,66 +34597,64 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.133, + "output": 0.266, + "cache_read": 0.028 }, 
"type": "chat" - } - ] - }, - "perplexity": { - "id": "perplexity", - "name": "Perplexity", - "display_name": "Perplexity", - "doc": "https://docs.perplexity.ai", - "models": [ + }, { - "id": "sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 3, - "output": 15 + "input": 0.053, + "output": 0.222 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Sonar Deep Research", - "display_name": "Perplexity Sonar Deep Research", + "id": "llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -33410,31 +34664,39 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131000, + "output": 131000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-02-01", - "last_updated": "2025-09-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2, - "output": 8, - "reasoning": 3 + "input": 0.089, + "output": 0.275 }, "type": "chat" - }, + } + ] + 
}, + "baseten": { + "id": "baseten", + "name": "Baseten", + "display_name": "Baseten", + "api": "https://inference.baseten.co/v1", + "doc": "https://docs.baseten.co/development/model-apis/overview", + "models": [ { - "id": "sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -33444,72 +34706,61 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 164000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", "cost": { - "input": 1, - "output": 1 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 164000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 2, - "output": 8 + "input": 0.77, + "output": 0.77 }, "type": "chat" - } - ] - }, - "deepseek": { - "id": "deepseek", - "name": "DeepSeek", - "display_name": "DeepSeek", - 
"api": "https://api.deepseek.com", - "doc": "https://api-docs.deepseek.com/zh-cn/quick_start/pricing", - "models": [ + }, { - "id": "deepseek-chat", - "name": "DeepSeek Chat", - "display_name": "DeepSeek Chat", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -33519,30 +34770,41 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 163800, + "output": 131100 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2024-12-26", - "last_updated": "2026-04-24", + "knowledge": "2025-10", + "release_date": "2025-12-01", + "last_updated": "2026-03-06", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.3, + "output": 0.45 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -33552,10 +34814,10 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -33564,50 +34826,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Compatibility alias for deepseek-v4-flash thinking mode." 
] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-01-20", - "last_updated": "2026-04-24", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2026-03-06", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -33618,39 +34872,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." 
] } }, "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text" @@ -33660,8 +34905,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -33672,48 +34917,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." 
] } }, "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-12", + "release_date": "2026-01-30", + "last_updated": "2026-02-12", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.6, + "output": 3 }, "type": "chat" - } - ] - }, - "llama": { - "id": "llama", - "name": "Llama", - "display_name": "Llama", - "api": "https://api.llama.com/compat/v1/", - "doc": "https://llama.developer.meta.com/docs/models", - "models": [ + }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct 0905", + "display_name": "Kimi K2 Instruct 0905", "modalities": { "input": [ "text" @@ -33723,30 +34949,30 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-08", + "release_date": "2025-09-05", + "last_updated": "2026-03-06", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "cerebras-llama-4-maverick-17b-128e-instruct", - "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "modalities": { + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", + "modalities": { "input": [ "text" ], @@ -33756,28 +34982,34 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + 
}, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "llama-3.3-8b-instruct", - "name": "Llama-3.3-8B-Instruct", - "display_name": "Llama-3.3-8B-Instruct", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -33787,29 +35019,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "cerebras-llama-4-scout-17b-16e-instruct", - "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", - "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -33819,29 +35063,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ 
+ "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2026-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0 + "input": 0.95, + "output": 3.15 }, "type": "chat" }, { - "id": "groq-llama-4-maverick-17b-128e-instruct", - "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "id": "zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -33851,104 +35107,122 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-08-31", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct-fp8", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "nvidia/Nemotron-120B-A12B", + "name": "Nemotron 3 Super", + "display_name": "Nemotron 3 Super", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 32678 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.75 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204000, + "output": 204000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2026-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2 }, "type": "chat" - } - ] - }, - "fireworks-ai": { - "id": "fireworks-ai", - "name": "Fireworks AI", - "display_name": "Fireworks AI", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://fireworks.ai/docs/", - "models": [ + }, { - "id": "accounts/fireworks/models/glm-5p1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -33958,8 +35232,8 @@ ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 1000000, + "output": 
384000 }, "temperature": true, "tool_call": true, @@ -33980,19 +35254,62 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 1.74, + "output": 3.48, + "cache_read": 0.15 + }, + "type": "chat" + } + ] + }, + "llama": { + "id": "llama", + "name": "Llama", + "display_name": "Llama", + "api": "https://api.llama.com/compat/v1/", + "doc": "https://llama.developer.meta.com/docs/models", + "models": [ + { + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/deepseek-v3p2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "cerebras-llama-4-scout-17b-16e-instruct", + "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ "text" @@ -34002,42 +35319,29 @@ ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": 
true, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.28 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/minimax-m2p5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "llama-3.3-8b-instruct", + "name": "Llama-3.3-8B-Instruct", + "display_name": "Llama-3.3-8B-Instruct", "modalities": { "input": [ "text" @@ -34047,41 +35351,62 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0, + "output": 0 }, - "attachment": false, + "type": "chat" + }, + { + "id": "llama-4-scout-17b-16e-instruct-fp8", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-4p5-air", - "name": "GLM 4.5 Air", 
- "display_name": "GLM 4.5 Air", + "id": "cerebras-llama-4-maverick-17b-128e-instruct", + "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ "text" @@ -34091,30 +35416,29 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -34124,41 +35448,29 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/deepseek-v3p1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "groq-llama-4-maverick-17b-128e-instruct", + "name": 
"Groq-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ "text" @@ -34168,42 +35480,51 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "novita-ai": { + "id": "novita-ai", + "name": "NovitaAI", + "display_name": "NovitaAI", + "api": "https://api.novita.ai/openai", + "doc": "https://novita.ai/docs/guides/introduction", + "models": [ { - "id": "accounts/fireworks/models/kimi-k2p6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -34222,21 +35543,22 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "accounts/fireworks/models/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ 
-34246,8 +35568,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -34257,52 +35579,49 @@ "attachment": false, "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 1, - "output": 3 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "accounts/fireworks/models/qwen3p6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-04", - "last_updated": "2026-04-04", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.1 + "input": 0.57, + "output": 2.3 }, "type": "chat" }, { - "id": "accounts/fireworks/models/minimax-m2p1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -34312,8 +35631,8 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -34334,74 +35653,68 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 
0.03 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "accounts/fireworks/models/minimax-m2p7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: GPT OSS 20B", + "display_name": "OpenAI: GPT OSS 20B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-12", - "last_updated": "2026-04-12", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.04, + "output": 0.15 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-4p7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 198000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -34411,31 +35724,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0.6, - "output": 2.2, - 
"cache_read": 0.3 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-4p5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "zai-org/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -34445,7 +35750,7 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, @@ -34467,32 +35772,65 @@ }, "attachment": false, "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 98304 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-10-13", + "last_updated": "2025-10-13", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0.13, + "output": 0.85 }, "type": "chat" }, { - "id": "accounts/fireworks/models/kimi-k2p5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "zai-org/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", - "image", - "video" + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -34500,33 +35838,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": 
true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { "input": 0.6, - "output": 3, - "cache_read": 0.1 + "output": 1.8, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "accounts/fireworks/models/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "zai-org/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -34536,8 +35863,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -34552,18 +35879,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "accounts/fireworks/models/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "zai-org/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -34573,8 +35902,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -34584,23 +35913,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.55, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": 
"accounts/fireworks/models/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -34610,8 +35946,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -34632,19 +35968,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0.6, - "output": 2.5, - "cache_read": 0.3 + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "accounts/fireworks/routers/kimi-k2p5-turbo", - "name": "Kimi K2.5 Turbo", - "display_name": "Kimi K2.5 Turbo", + "id": "zai-org/autoglm-phone-9b-multilingual", + "name": "AutoGLM-Phone-9B-Multilingual", + "display_name": "AutoGLM-Phone-9B-Multilingual", "modalities": { "input": [ "text", @@ -34655,8 +35991,39 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 65536, + "output": 65536 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-10", + "last_updated": "2025-12-10", + "cost": { + "input": 0.035, + "output": 0.138 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -34677,20 +36044,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 }, 
"type": "chat" }, { - "id": "accounts/fireworks/models/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "zai-org/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -34700,8 +36066,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 202800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -34722,41 +36088,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-02-11", + "last_updated": "2026-02-12", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.15 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" - } - ] - }, - "kimi-for-coding": { - "id": "kimi-for-coding", - "name": "Kimi For Coding", - "display_name": "Kimi For Coding", - "api": "https://api.kimi.com/coding/v1", - "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", - "models": [ + }, { - "id": "k2p6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "zai-org/glm-4.6v", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ "text", - "image", - "video" + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 131072, "output": 32768 }, "temperature": true, @@ -34765,60 +36121,54 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04", - "last_updated": "2026-04", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 0.9, + "cache_read": 0.055 }, "type": "chat" }, { - "id": "k2p5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "baichuan/baichuan-m2-32b", + "name": "baichuan-m2-32b", + "display_name": 
"baichuan-m2-32b", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2024-12", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.07, + "output": 0.07 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "minimax/minimax-m2.1", + "name": "Minimax M2.1", + "display_name": "Minimax M2.1", "modalities": { "input": [ "text" @@ -34828,14 +36178,13 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -34850,30 +36199,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11", - "last_updated": "2025-12", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" - } - ] - }, - "moark": { - "id": "moark", - "name": "Moark", - "display_name": "Moark", - "api": "https://moark.com/v1", - "doc": "https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", - "models": [ + }, { - "id": "GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "minimax/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ 
-34905,19 +36243,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 3.5, - "output": 14 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -34928,7 +36266,7 @@ }, "limit": { "context": 204800, - "output": 131072 + "output": 131100 }, "temperature": true, "tool_call": true, @@ -34938,30 +36276,28 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2.1, - "output": 8.4 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" - } - ] - }, - "opencode-go": { - "id": "opencode-go", - "name": "OpenCode Go", - "display_name": "OpenCode Go", - "api": "https://opencode.ai/zen/go/v1", - "doc": "https://opencode.ai/docs/zen", - "models": [ + }, { - "id": "minimax-m2.7", + "id": "minimax/minimax-m2.7", "name": "MiniMax M2.7", "display_name": "MiniMax M2.7", "modalities": { @@ -34995,7 +36331,6 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", "release_date": "2026-03-18", "last_updated": "2026-03-18", "cost": { @@ -35006,22 +36341,20 @@ "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax M2.5 Highspeed", + "display_name": "MiniMax M2.5 Highspeed", "modalities": { 
"input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131100 }, "temperature": true, "tool_call": true, @@ -35040,22 +36373,21 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { "input": 0.6, - "output": 3, - "cache_read": 0.1 + "output": 2.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo V2.5 Pro", - "display_name": "MiMo V2.5 Pro", + "id": "kwaipilot/kat-coder-pro", + "name": "Kat Coder Pro", + "display_name": "Kat Coder Pro", "modalities": { "input": [ "text" @@ -35065,47 +36397,29 @@ ] }, "limit": { - "context": 1048576, + "context": 256000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-01-05", + "last_updated": "2026-01-05", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "nousresearch/hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ "text" @@ -35115,191 +36429,121 @@ ] }, "limit": { - "context": 202752, - "output": 32768 + "context": 
8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo V2 Omni", - "display_name": "MiMo V2 Omni", + "id": "sao10K/l3-8b-lunaris", + "name": "Sao10k L3 8B Lunaris\t", + "display_name": "Sao10k L3 8B Lunaris\t", "modalities": { "input": [ - "text", - "image", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-11-28", + "last_updated": "2024-11-28", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo V2.5", - "display_name": "MiMo V2.5", + "id": "sao10K/l31-70b-euryale-v2.2", + "name": "L31 70B Euryale V2.2", + "display_name": "L31 70B Euryale V2.2", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" 
], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "sao10K/L3-8B-stheno-v3.2", + "name": "L3 8B Stheno V3.2", + "display_name": "L3 8B Stheno V3.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": 
"sao10K/l3-70b-euryale-v2.1", + "name": "L3 70B Euryale V2.1\t", + "display_name": "L3 70B Euryale V2.1\t", "modalities": { "input": [ "text" @@ -35309,92 +36553,63 @@ ] }, "limit": { - "context": 202752, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "release_date": "2024-06-18", + "last_updated": "2024-06-18", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "paddlepaddle/paddleocr-vl", + "name": "PaddleOCR-VL", + "display_name": "PaddleOCR-VL", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-10-22", + "last_updated": "2025-10-22", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": 
"Kimi K2.6", + "id": "inclusionai/ling-2.6-1t", + "name": "Ling-2.6-1T", + "display_name": "Ling-2.6-1T", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -35402,41 +36617,27 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "inclusionai/ling-2.6-flash", + "name": "Ling-2.6-flash", + "display_name": "Ling-2.6-flash", "modalities": { "input": [ "text" @@ -35446,42 +36647,29 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", "release_date": "2026-04-24", "last_updated": "2026-04-24", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.0145 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "mistralai/mistral-nemo", + "name": 
"Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -35491,92 +36679,61 @@ ] }, "limit": { - "context": 204800, - "output": 65536 + "context": 60288, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2024-07-30", + "last_updated": "2024-07-30", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.04, + "output": 0.17 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo V2 Pro", - "display_name": "MiMo V2 Pro", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 
Plus", - "display_name": "Qwen3.5 Plus", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B Instruct", + "display_name": "Qwen2.5 VL 72B Instruct", "modalities": { "input": [ "text", @@ -35588,52 +36745,28 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "open_weights": true, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.2, - "output": 1.2, - "cache_read": 0.02, - "cache_write": 0.25 + "input": 0.8, + "output": 0.8 }, "type": "chat" - } - ] - }, - "databricks": { - "id": "databricks", - "name": "Databricks", - "display_name": "Databricks", - "api": "https://${DATABRICKS_HOST}/ai-gateway/mlflow/v1", - "doc": "https://docs.databricks.com/aws/en/machine-learning/foundation-models/", - "models": [ + }, { - "id": "databricks-gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen/qwen2.5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -35643,32 +36776,33 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.072, - "output": 0.28 + "input": 0.07, + 
"output": 0.07 }, "type": "chat" }, { - "id": "databricks-gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -35679,140 +36813,113 @@ "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0.98, + "output": 3.95 }, "type": "chat" }, { - "id": "databricks-claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-10-15", + "last_updated": "2024-10-15", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.38, + "output": 0.4 }, "type": "chat" }, { - "id": "databricks-claude-sonnet-4-6", - 
"name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 40960, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.09, + "output": 0.45 }, "type": "chat" }, { - "id": "databricks-gemini-3-pro", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5-122B-A10B", + "display_name": "Qwen3.5-122B-A10B", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -35820,214 +36927,193 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, 
+ "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.4, + "output": 3.2 }, "type": "chat" }, { - "id": "databricks-gemini-3-1-pro", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "qwen/qwen3-omni-30b-a3b-instruct", + "name": "Qwen3 Omni 30B A3B Instruct", + "display_name": "Qwen3 Omni 30B A3B Instruct", "modalities": { "input": [ "text", - "image", "video", "audio", - "pdf" + "image" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.25, + "output": 0.97, + "input_audio": 2.2, + "output_audio": 1.788 }, "type": "chat" }, { - "id": "databricks-gpt-5-4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "qwen/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": 
false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 2.11, + "output": 8.45 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "databricks-gemini-2-5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "qwen/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "databricks-gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "qwen/qwen3-omni-30b-a3b-thinking", + "name": "Qwen3 Omni 30B A3B Thinking", + "display_name": "Qwen3 Omni 30B A3B Thinking", "modalities": { "input": [ "text", + "audio", + "video", "image" ], "output": [ @@ -36035,273 +37121,236 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.25, + "output": 0.97, + "input_audio": 2.2, + "output_audio": 1.788 }, "type": "chat" }, { - "id": "databricks-gpt-5-4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", - "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", + "cost": { + "input": 0.15, + "output": 1.5 + }, "type": "chat" }, { - "id": "databricks-gemini-3-1-flash-lite", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "qwen/qwen3-4b-fp8", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - 
"output": 65536 + "context": 128000, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "databricks-gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "qwen/qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 40960, + "output": 20000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "qwen/qwen-mt-plus", + "name": "Qwen MT Plus", + "display_name": "Qwen MT Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - 
"open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - }, - { - "id": "databricks-gpt-5-2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-03", + "last_updated": "2025-09-03", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.25, + "output": 0.75 }, "type": "chat" }, { - "id": "databricks-gpt-5-5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "qwen/qwen3-vl-30b-a3b-thinking", + "display_name": "qwen/qwen3-vl-30b-a3b-thinking", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "open_weights": true, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - 
"output": 45, - "cache_read": 1 - } + "input": 0.2, + "output": 1 }, "type": "chat" }, { - "id": "databricks-gemini-3-flash", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5-35B-A3B", + "display_name": "Qwen3.5-35B-A3B", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -36310,319 +37359,279 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "qwen/qwen3-32b-fp8", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 40960, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 5, - "output": 25, - "cache_read": 
0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0.45 }, "type": "chat" }, { - "id": "databricks-gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "qwen/qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.09, + "output": 0.58 }, "type": "chat" }, { - "id": "databricks-claude-sonnet-4", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 1.3 }, "type": "chat" }, { - 
"id": "databricks-gpt-5-1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "qwen/qwen3-vl-8b-instruct", + "display_name": "qwen/qwen3-vl-8b-instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2025-10-17", + "last_updated": "2025-10-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.08, + "output": 0.5 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22b Thinking 2507", + "display_name": "Qwen3 235B A22b Thinking 2507", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a 
thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 3 }, "type": "chat" }, { - "id": "databricks-gemini-2-5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30b A3B Instruct", + "display_name": "Qwen3 Coder 30b A3B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 160000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.07, + "output": 0.27 }, "type": "chat" }, { - "id": "databricks-gpt-5-4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - 
"knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "databricks-claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5-27B", + "display_name": "Qwen3.5-27B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -36630,66 +37639,64 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 2.4 }, "type": "chat" - } - ] - }, - "io-net": { - "id": "io-net", - "name": "IO.NET", - "display_name": "IO.NET", - "api": "https://api.intelligence.io.solutions/api/v1", - "doc": "https://io.net/docs/guides/intelligence/io-intelligence", - "models": [ + }, { - "id": "Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "qwen/qwen3-vl-30b-a3b-instruct", + "display_name": "qwen/qwen3-vl-30b-a3b-instruct", "modalities": { "input": [ - "text" + "text", + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 
106000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "cost": { - "input": 0.22, - "output": 0.95, - "cache_read": 0.11, - "cache_write": 0.44 + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen 3 Next 80B Instruct", - "display_name": "Qwen 3 Next 80B Instruct", + "id": "qwen/qwen3-8b-fp8", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ "text" @@ -36699,34 +37706,33 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 128000, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-10", - "last_updated": "2025-01-10", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.1, - "output": 0.8, - "cache_read": 0.05, - "cache_write": 0.2 + "input": 0.035, + "output": 0.138 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen 3 235B Thinking", - "display_name": "Qwen 3 235B Thinking", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B", + "display_name": "Gemma 4 26B A4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -36734,7 +37740,7 @@ }, "limit": { "context": 262144, - "output": 4096 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -36742,34 +37748,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - 
"continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.11, - "output": 0.6, - "cache_read": 0.055, - "cache_write": 0.22 + "input": 0.13, + "output": 0.4 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen 2.5 VL 32B Instruct", - "display_name": "Qwen 2.5 VL 32B Instruct", + "id": "google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ "text", @@ -36780,139 +37772,124 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 98304, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0.025, - "cache_write": 0.1 + "input": 0.119, + "output": 0.2 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-15", - "last_updated": "2024-11-15", + "attachment": true, + "open_weights": true, + "release_date": 
"2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.4, - "output": 1.75, - "cache_read": 0.2, - "cache_write": 0.8 + "input": 0.14, + "output": 0.4 }, "type": "chat" }, { - "id": "mistralai/Magistral-Small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "google/gemma-3-12b-it", + "name": "Gemma 3 12B", + "display_name": "Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0.25, - "cache_write": 1 + "input": 0.05, + "output": 0.1 }, "type": "chat" }, { - "id": "mistralai/Mistral-Large-Instruct-2411", - "name": "Mistral Large Instruct 2411", - "display_name": "Mistral Large Instruct 2411", + "id": "microsoft/wizardlm-2-8x22b", + "name": "Wizardlm 2 8x22B", + "display_name": "Wizardlm 2 8x22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65535, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "release_date": "2024-04-24", + "last_updated": "2024-04-24", "cost": { - "input": 2, - "output": 6, - "cache_read": 1, - "cache_write": 4 + "input": 0.62, + "output": 0.62 }, "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": 
"Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "gryphe/mythomax-l2-13b", + "name": "Mythomax L2 13B", + "display_name": "Mythomax L2 13B", "modalities": { "input": [ "text" @@ -36922,31 +37899,28 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 4096, + "output": 3200 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-05", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.02, - "output": 0.04, - "cache_read": 0.01, - "cache_write": 0.04 + "input": 0.09, + "output": 0.09 }, "type": "chat" }, { - "id": "mistralai/Devstral-Small-2505", - "name": "Devstral Small 2505", - "display_name": "Devstral Small 2505", + "id": "deepseek/deepseek-r1-0528-qwen3-8b", + "name": "DeepSeek R1 0528 Qwen3 8B", + "display_name": "DeepSeek R1 0528 Qwen3 8B", "modalities": { "input": [ "text" @@ -36957,30 +37931,28 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "open_weights": true, + "release_date": "2025-05-29", + "last_updated": "2025-05-29", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0.025, - "cache_write": 0.1 + "input": 0.06, + "output": 0.09 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "deepseek/deepseek-prover-v2-671b", + "name": "Deepseek Prover V2 671B", + "display_name": "Deepseek Prover V2 671B", "modalities": { "input": [ "text" @@ -36990,66 +37962,60 @@ ] }, "limit": { - 
"context": 128000, - "output": 4096 + "context": 160000, + "output": 160000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-04-30", + "last_updated": "2025-04-30", "cost": { - "input": 0.13, - "output": 0.38, - "cache_read": 0.065, - "cache_write": 0.26 + "input": 0.7, + "output": 2.5 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "id": "deepseek/deepseek-r1-turbo", + "name": "DeepSeek R1 (Turbo)\t", + "display_name": "DeepSeek R1 (Turbo)\t", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 430000, - "output": 4096 + "context": 64000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075, - "cache_write": 0.3 + "input": 0.7, + "output": 2.5 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", - "name": "Llama 3.2 90B Vision Instruct", - "display_name": "Llama 3.2 90B Vision Instruct", + "id": "deepseek/deepseek-ocr-2", + "name": "deepseek/deepseek-ocr-2", + "display_name": "deepseek/deepseek-ocr-2", "modalities": { "input": [ "text", @@ -37060,31 +38026,27 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, 
"open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.35, - "output": 0.4, - "cache_read": 0.175, - "cache_write": 0.7 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "deepseek/deepseek-v3.2-exp", + "name": "Deepseek V3.2 Exp", + "display_name": "Deepseek V3.2 Exp", "modalities": { "input": [ "text" @@ -37094,8 +38056,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37103,34 +38065,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-28", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2, - "output": 8.75, - "cache_read": 1, - "cache_write": 4 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT-OSS 20B", - "display_name": "GPT-OSS 20B", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -37140,36 +38088,42 @@ ] }, "limit": { - "context": 64000, - "output": 4096 + "context": 163840, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, 
"open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.03, - "output": 0.14, - "cache_read": 0.015, - "cache_write": 0.06 + "input": 0.7, + "output": 2.5, + "cache_read": 0.35 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -37179,36 +38133,30 @@ ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-07", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.04, - "output": 0.4, - "cache_read": 0.02, - "cache_write": 0.08 + "input": 0.27, + "output": 1.12, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "deepseek/deepseek-v3.2", + "name": "Deepseek V3.2", + "display_name": "Deepseek V3.2", "modalities": { "input": [ "text" @@ -37218,8 +38166,8 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37239,65 +38187,52 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.55, - "output": 2.25, - "cache_read": 
0.275, - "cache_write": 1.1 + "input": 0.269, + "output": 0.4, + "cache_read": 0.1345 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "deepseek/deepseek-ocr", + "name": "DeepSeek-OCR", + "display_name": "DeepSeek-OCR", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-09-05", - "last_updated": "2024-09-05", + "attachment": true, + "open_weights": true, + "release_date": "2025-10-24", + "last_updated": "2025-10-24", "cost": { - "input": 0.39, - "output": 1.9, - "cache_read": 0.195, - "cache_write": 0.78 + "input": 0.03, + "output": 0.03 }, "type": "chat" - } - ] - }, - "alibaba-cn": { - "id": "alibaba-cn", - "name": "alibaba-cn", - "display_name": "alibaba-cn", - "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "models": [ + }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "deepseek/deepseek-v3-turbo", + "name": "DeepSeek V3 (Turbo)\t", + "display_name": "DeepSeek V3 (Turbo)\t", "modalities": { "input": [ "text" @@ -37307,47 +38242,28 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 64000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, 
"open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.287, - "output": 1.147, - "reasoning": 2.868 + "input": 0.4, + "output": 1.3 }, "type": "chat" }, { - "id": "qwen-plus-character", - "name": "Qwen Plus Character", - "display_name": "Qwen Plus Character", + "id": "deepseek/deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "display_name": "DeepSeek R1 Distill Qwen 14B", "modalities": { "input": [ "text" @@ -37358,28 +38274,27 @@ }, "limit": { "context": 32768, - "output": 4096 + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.115, - "output": 0.287 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "qwen2-5-math-7b-instruct", - "name": "Qwen2.5-Math 7B Instruct", - "display_name": "Qwen2.5-Math 7B Instruct", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -37389,75 +38304,67 @@ ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.144, - "output": 0.287 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Moonshot Kimi K2.5", - "display_name": "Moonshot Kimi K2.5", + "id": 
"deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill LLama 70B", + "display_name": "DeepSeek R1 Distill LLama 70B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.574, - "output": 2.411 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "qwen-doc-turbo", - "name": "Qwen Doc Turbo", - "display_name": "Qwen Doc Turbo", + "id": "deepseek/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -37467,196 +38374,157 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 64000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.087, - "output": 0.144 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen-vl-ocr", - "name": "Qwen Vl Ocr", - "display_name": "Qwen Vl Ocr", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "Deepseek V3.1 Terminus", + "display_name": "Deepseek V3.1 Terminus", "modalities": { "input": [ - "text", - "image" + 
"text" ], "output": [ "text" ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-28", - "last_updated": "2025-04-13", + "open_weights": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.717, - "output": 0.717 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "qwen-omni-turbo-realtime", - "name": "Qwen-Omni Turbo Realtime", - "display_name": "Qwen-Omni Turbo Realtime", + "id": "minimaxai/minimax-m1-80k", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 1000000, + "output": 40000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "open_weights": true, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.23, - "output": 0.918, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "qwen3-8b", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick Instruct", + "display_name": "Llama 4 Maverick Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1048576, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - 
"default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-04-06", + "last_updated": "2025-04-06", "cost": { - "input": 0.072, - "output": 0.287, - "reasoning": 0.717 + "input": 0.27, + "output": 0.85 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout Instruct", + "display_name": "Llama 4 Scout Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2025-04-06", + "last_updated": "2025-04-06", "cost": { - "input": 0.43, - "output": 2.58, - "reasoning": 2.58 + "input": 0.18, + "output": 0.59 }, "type": "chat" }, { - "id": "qwen-math-turbo", - "name": "Qwen Math Turbo", - "display_name": "Qwen Math Turbo", + "id": "meta-llama/llama-3-70b-instruct", + "name": "Llama3 70B Instruct", + "display_name": "Llama3 70B Instruct", "modalities": { "input": [ "text" @@ -37666,29 +38534,28 @@ ] }, 
"limit": { - "context": 4096, - "output": 3072 + "context": 8192, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.51, + "output": 0.74 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "meta-llama/llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -37698,56 +38565,31 @@ ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.23, - "output": 0.574 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -37755,7 +38597,7 @@ }, "limit": { "context": 131072, - 
"output": 8192 + "output": 120000 }, "temperature": true, "tool_call": true, @@ -37763,20 +38605,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-07", + "last_updated": "2024-12-07", "cost": { - "input": 0.115, - "output": 0.287 + "input": 0.135, + "output": 0.4 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -37786,40 +38628,28 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 32768, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.86, - "output": 3.15 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -37829,34 +38659,28 @@ ] }, "limit": { - "context": 32768, + "context": 16384, "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - 
"reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.02, + "output": 0.05 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "xiaomimimo/mimo-v2-flash", + "name": "XiaomiMiMo/MiMo-V2-Flash", + "display_name": "XiaomiMiMo/MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -37866,58 +38690,44 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-12", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 0.287, - "output": 1.147, - "reasoning": 2.868 + "input": 0.1, + "output": 0.3, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "baidu/ernie-4.5-vl-28b-a3b-thinking", + "name": "ERNIE-4.5-VL-28B-A3B-Thinking", + "display_name": "ERNIE-4.5-VL-28B-A3B-Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37925,69 +38735,53 @@ "supported": true, "default": true }, - "extra_capabilities": { - 
"reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.39, + "output": 0.39 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "ERNIE 4.5 VL 424B A47B", + "display_name": "ERNIE 4.5 VL 424B A47B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 123000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "attachment": true, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.345, - "output": 1.377 + "input": 0.42, + "output": 1.25 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "baidu/ernie-4.5-21B-a3b-thinking", + "name": "ERNIE-4.5-21B-A3B-Thinking", + "display_name": "ERNIE-4.5-21B-A3B-Thinking", "modalities": { "input": [ "text" @@ -37997,68 +38791,41 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { 
- "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.115, - "output": 0.287, - "reasoning": 1.147 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "baidu/ernie-4.5-21B-a3b", + "name": "ERNIE 4.5 21B A3B", + "display_name": "ERNIE 4.5 21B A3B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 120000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -38066,22 +38833,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.058, - "output": 0.23, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "baidu/ernie-4.5-300b-a47b-paddle", + "name": "ERNIE 4.5 300B A47B", + "display_name": "ERNIE 4.5 300B A47B", "modalities": { "input": [ "text" @@ -38091,52 +38856,28 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 123000, + "output": 12000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - 
"supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.022, - "output": 0.216 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "qwen2-5-vl-7b-instruct", - "name": "Qwen2.5-VL 7B Instruct", - "display_name": "Qwen2.5-VL 7B Instruct", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "ERNIE 4.5 VL 28B A3B", + "display_name": "ERNIE 4.5 VL 28B A3B", "modalities": { "input": [ "text", @@ -38147,40 +38888,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 30000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.287, - "output": 0.717 + "input": 1.4, + "output": 5.6 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -38199,33 +38942,33 @@ ] } 
}, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.574, - "output": 2.294 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen3.5-flash", - "name": "Qwen3.5 Flash", - "display_name": "Qwen3.5 Flash", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -38244,35 +38987,33 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.172, - "output": 1.72, - "reasoning": 1.72 + "input": 1.69, + "output": 3.38, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -38292,65 +39033,82 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.276, - "output": 1.651, - 
"cache_read": 0.028, - "cache_write": 0.344 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "digitalocean": { + "id": "digitalocean", + "name": "DigitalOcean", + "display_name": "DigitalOcean", + "api": "https://inference.do-ai.run/v1", + "doc": "https://docs.digitalocean.com/products/gradient-ai-platform/details/models/", + "models": [ { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "openai-gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-30", "cost": { - "input": 0.861, - "output": 3.441 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "openai-o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -38360,168 +39118,146 @@ ] }, "limit": { - "context": 202752, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, 
"tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-14", - "last_updated": "2026-04-14", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.87, - "output": 3.48, - "cache_read": 0.17 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "qwen3-omni-flash", - "name": "Qwen3-Omni Flash", - "display_name": "Qwen3-Omni Flash", + "id": "bge-reranker-v2-m3", + "name": "BGE Reranker v2 M3", + "display_name": "BGE Reranker v2 M3", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 8192, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "release_date": "2024-03-12", + "last_updated": "2026-04-30", "cost": { - "input": 0.058, - "output": 0.23, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "rerank" }, { - "id": "deepseek-v3-1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "openai-gpt-5-mini", + "name": "GPT-5 mini", + "display_name": "GPT-5 mini", "modalities": { "input": [ - "text" + 
"text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.574, - "output": 1.721 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen2-5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "openai-o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.574, - "output": 1.721 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3-VL 235B-A22B", - "display_name": "Qwen3-VL 235B-A22B", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 262144, "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -38540,197 +39276,191 @@ }, "attachment": false, 
"open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-04-16", "cost": { - "input": 0.286705, - "output": 1.14682, - "reasoning": 2.867051 + "input": 0.5, + "output": 2.7 }, "type": "chat" }, { - "id": "qwen-math-plus", - "name": "Qwen Math Plus", - "display_name": "Qwen Math Plus", + "id": "anthropic-claude-4.5-haiku", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-08-16", - "last_updated": "2024-09-19", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.574, - "output": 1.721 + "input": 1, + "output": 5, + "cache_read": 1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen2-5-coder-32b-instruct", - "name": "Qwen2.5-Coder 32B Instruct", - "display_name": "Qwen2.5-Coder 32B Instruct", + "id": "openai-gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-11", - "last_updated": "2024-11", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.287, - "output": 0.861 + "input": 
0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen3-asr-flash", - "name": "Qwen3-ASR Flash", - "display_name": "Qwen3-ASR Flash", + "id": "llama3.3-70b-instruct", + "name": "Llama 3.3 Instruct 70B", + "display_name": "Llama 3.3 Instruct 70B", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.032, - "output": 0.032 + "input": 0.65, + "output": 0.65 }, "type": "chat" }, { - "id": "qwen-deep-research", - "name": "Qwen Deep Research", - "display_name": "Qwen Deep Research", + "id": "nemotron-3-nano-omni", + "name": "Nemotron Nano 3 Omni", + "display_name": "Nemotron Nano 3 Omni", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-28", + "last_updated": "2026-04-30", "cost": { - "input": 7.742, - "output": 23.367 + "input": 0.5, + "output": 0.9 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "nemotron-nano-12b-v2-vl", + "name": "Nemotron Nano 12B v2 VL", + 
"display_name": "Nemotron Nano 12B v2 VL", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "knowledge": "2024-10", + "release_date": "2025-12-01", + "last_updated": "2026-04-30", "cost": { - "input": 0.144, - "output": 1.434 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen-mt-plus", - "name": "Qwen Mt Plus", - "display_name": "Qwen Mt Plus", + "id": "mistral-7b-instruct-v0.3", + "name": "Mistral 7B Instruct v0.3", + "display_name": "Mistral 7B Instruct v0.3", "modalities": { "input": [ "text" @@ -38740,29 +39470,24 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", - "cost": { - "input": 0.259, - "output": 0.775 - }, + "open_weights": true, + "release_date": "2024-05-22", + "last_updated": "2024-05-22", "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-32b", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill Qwen 32B", + "id": "nemotron-3-nano-30b", + "name": "Nemotron 3 Nano 30B A3B", + "display_name": "Nemotron 3 Nano 30B A3B", "modalities": { "input": [ "text" @@ -38772,8 
+39497,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -38782,52 +39507,52 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.287, - "output": 0.861 - }, + "open_weights": true, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "anthropic-claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.23, - "output": 0.574 + "input": 1, + "output": 5, + "cache_read": 1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "all-mini-lm-l6-v2", + "name": "All-MiniLM-L6-v2", + "display_name": "All-MiniLM-L6-v2", "modalities": { "input": [ "text" @@ -38837,157 +39562,178 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 256, + "output": 384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "release_date": 
"2021-08-30", + "last_updated": "2026-04-16", "cost": { - "input": 0.144, - "output": 0.574 + "input": 0.009, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-7b", - "name": "DeepSeek R1 Distill Qwen 7B", - "display_name": "DeepSeek R1 Distill Qwen 7B", + "id": "openai-gpt-image-1", + "name": "GPT Image 1", + "display_name": "GPT Image 1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-04-24", + "last_updated": "2025-04-24", "cost": { - "input": 0.072, - "output": 0.144 + "input": 5, + "output": 40, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen2-5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "qwen3-tts-voicedesign", + "name": "Qwen3 TTS VoiceDesign", + "display_name": "Qwen3 TTS VoiceDesign", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", - "cost": { - "input": 0.072, - "output": 0.144 - }, + "release_date": "2026-04-21", + "last_updated": "2026-04-30", "type": "chat" }, { - "id": "qwen2-5-14b-instruct", - "name": "Qwen2.5 14B Instruct", - "display_name": "Qwen2.5 14B Instruct", + "id": "openai-gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { 
"input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.144, - "output": 0.431 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "tongyi-intent-detect-v3", - "name": "Tongyi Intent Detect V3", - "display_name": "Tongyi Intent Detect V3", + "id": "anthropic-claude-4.5-sonnet", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.058, - "output": 0.144 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 + } }, "type": "chat" }, { - "id": "qwq-32b", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "deepseek-v4-pro", + 
"name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -38997,8 +39743,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -39019,127 +39765,136 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.287, - "output": 0.861 + "input": 1.74, + "output": 3.48 }, "type": "chat" }, { - "id": "moonshot-kimi-k2-instruct", - "name": "Moonshot Kimi K2 Instruct", - "display_name": "Moonshot Kimi K2 Instruct", + "id": "anthropic-claude-4.1-opus", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.574, - "output": 2.294 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen2-5-32b-instruct", - "name": "Qwen2.5 32B Instruct", - "display_name": "Qwen2.5 32B Instruct", + "id": "openai-gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": 
false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.287, - "output": 0.861 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "openai-gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.144, - "output": 0.574 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen3-omni-flash-realtime", - "name": "Qwen3-Omni Flash Realtime", - "display_name": "Qwen3-Omni Flash Realtime", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral Nemo Instruct", + "display_name": "Mistral Nemo Instruct", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, + "context": 128000, "output": 16384 }, "temperature": true, @@ -39148,35 +39903,30 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "release_date": "2024-07-18", + "last_updated": 
"2024-07-18", "cost": { - "input": 0.23, - "output": 0.918, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Moonshot Kimi K2.6", - "display_name": "Moonshot Kimi K2.6", + "id": "nvidia-nemotron-3-super-120b", + "name": "Nemotron-3-Super-120B", + "display_name": "Nemotron-3-Super-120B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -39184,44 +39934,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-04-16", "cost": { - "input": 0.929, - "output": 3.858 + "input": 0.3, + "output": 0.65 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b", - "name": "Qwen3-VL 30B-A3B", - "display_name": "Qwen3-VL 30B-A3B", + "id": "arcee-trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -39229,33 +39967,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - 
"last_updated": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-16", "cost": { - "input": 0.108, - "output": 0.431, - "reasoning": 1.076 + "input": 0.25, + "output": 0.9, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3 VL Plus", - "display_name": "Qwen3 VL Plus", + "id": "anthropic-claude-3.5-sonnet", + "name": "Claude 3.5 Sonnet", + "display_name": "Claude 3.5 Sonnet", "modalities": { "input": [ "text", @@ -39266,142 +39992,136 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-10-22", "cost": { - "input": 0.143353, - "output": 1.433525, - "reasoning": 4.300576 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "deepseek-v3-2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "openai-gpt-5.2-pro", + "name": "GPT-5.2 pro", + "display_name": "GPT-5.2 pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - 
"release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.287, - "output": 0.431 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "openai-gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.861, - "output": 3.441 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-1-5b", - "name": "DeepSeek R1 Distill Qwen 1.5B", - "display_name": "DeepSeek R1 Distill Qwen 1.5B", + "id": "openai-gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0, - "output": 0 + 
"input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -39411,8 +40131,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 163840, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -39421,19 +40141,15 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", - "cost": { - "input": 0.216, - "output": 0.861 - }, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-03-24", "type": "chat" }, { - "id": "qwen2-5-coder-7b-instruct", - "name": "Qwen2.5-Coder 7B Instruct", - "display_name": "Qwen2.5-Coder 7B Instruct", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -39443,29 +40159,35 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-11", - "last_updated": "2024-11", + "knowledge": "2025-08", + "release_date": "2026-02-12", + "last_updated": "2026-04-16", "cost": { - "input": 0.144, - "output": 0.287 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "qwen3.5-397b-a17b", + "name": "Qwen 3.5 397B A17B", + "display_name": "Qwen 3.5 397B A17B", "modalities": { "input": [ "text" @@ -39475,19 +40197,14 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + 
"output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -39500,92 +40217,107 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-07-15", + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-04-30", "cost": { - "input": 0.044, - "output": 0.087, - "reasoning": 0.431 + "input": 0.55, + "output": 3.5 }, "type": "chat" }, { - "id": "qwen-mt-turbo", - "name": "Qwen Mt Turbo", - "display_name": "Qwen Mt Turbo", + "id": "ministral-3-8b-instruct-2512", + "name": "Ministral 3 8B", + "display_name": "Ministral 3 8B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-15", + "last_updated": "2025-12-15", + "type": "chat" + }, + { + "id": "openai-gpt-image-2", + "name": "GPT Image 2", + "display_name": "GPT Image 2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", - "cost": { - "input": 0.101, - "output": 0.28 - }, + "release_date": "2025-04-24", + "last_updated": "2025-04-24", "type": "chat" }, { - "id": "qwen2-5-math-72b-instruct", - "name": "Qwen2.5-Math 72B Instruct", - 
"display_name": "Qwen2.5-Math 72B Instruct", + "id": "stable-diffusion-3.5-large", + "name": "Stable Diffusion 3.5 Large", + "display_name": "Stable Diffusion 3.5 Large", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 256, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2024-10-22", + "last_updated": "2026-04-30", "cost": { - "input": 0.574, - "output": 1.721 + "input": 0.08, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ "text" @@ -39595,125 +40327,98 @@ ] }, "limit": { - "context": 245800, - "output": 65536 + "context": 8000, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-21", + "open_weights": true, + "release_date": "2025-06-03", + "last_updated": "2026-04-16", "cost": { - "input": 1.32, - "output": 7.9, - "cache_read": 0.132 + "input": 0.04, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen2-5-omni-7b", - "name": "Qwen2.5-Omni 7B", - "display_name": "Qwen2.5-Omni 7B", + "id": "openai-gpt-5-nano", + "name": "GPT-5 nano", + "display_name": "GPT-5 nano", 
"modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.087, - "output": 0.345, - "input_audio": 5.448 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "openai-gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.573, - "output": 3.44, - "reasoning": 3.44 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-14b", - "name": "DeepSeek R1 Distill Qwen 14B", - "display_name": "DeepSeek R1 Distill Qwen 14B", + "id": "deepseek-3.2", + "name": "DeepSeek 
V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -39723,8 +40428,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -39732,20 +40437,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-12-02", + "last_updated": "2026-04-30", "cost": { - "input": 0.144, - "output": 0.431 + "input": 0.5, + "output": 1.6 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "openai-gpt-5.4-pro", + "name": "GPT-5.4 pro", + "display_name": "GPT-5.4 pro", "modalities": { "input": [ "text", @@ -39756,29 +40473,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 2.294, - "output": 6.881 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -39788,8 +40506,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 
262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -39797,19 +40515,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2026-04-30", "cost": { - "input": 0.287, - "output": 1.147 + "input": 0.45, + "output": 1.7 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "openai-gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -39820,7 +40539,7 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -39828,31 +40547,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-08-05", + "last_updated": "2026-04-16", "cost": { - "input": 0.574, - "output": 2.294 + "input": 0.05, + "output": 0.45 }, "type": "chat" }, { - "id": "qvq-max", - "name": "QVQ Max", - "display_name": "QVQ Max", + "id": "openai-gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -39863,73 +40572,112 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "knowledge": 
"2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 1.147, - "output": 4.588 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Moonshot Kimi K2 Thinking", - "display_name": "Moonshot Kimi K2 Thinking", + "id": "anthropic-claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.574, - "output": 2.294 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 0.5, + "cache_write": 6.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 0.5, + "cache_write": 6.25 + } }, "type": "chat" }, { - "id": "qwen3-14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "alibaba-qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -39939,79 +40687,117 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-04-30", + "last_updated": "2026-04-16", "cost": { - "input": 0.144, - "output": 0.574, - "reasoning": 1.434 + "input": 0.25, + "output": 0.55 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-8b", - "name": "DeepSeek R1 Distill Llama 8B", - "display_name": "DeepSeek R1 Distill Llama 8B", + "id": "gemma-4-31B-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 256000, + 
"output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-30", + "cost": { + "input": 0.18, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "anthropic-claude-3.7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-11", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long", - "display_name": "Qwen Long", + "id": "llama3-8b-instruct", + "name": "Llama 3.1 Instruct (8B)", + "display_name": "Llama 3.1 Instruct (8B)", "modalities": { "input": [ "text" @@ -40021,76 +40807,90 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "open_weights": true, + 
"knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.072, - "output": 0.287 + "input": 0.198, + "output": 0.198 }, "type": "chat" }, { - "id": "kimi/kimi-k2.5", - "name": "kimi/kimi-k2.5", - "display_name": "kimi/kimi-k2.5", + "id": "anthropic-claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "MiniMax/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "gte-large-en-v1.5", + "name": "GTE Large (v1.5)", + "display_name": "GTE Large (v1.5)", "modalities": { "input": [ "text" @@ -40100,73 +40900,83 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-03-27", + "last_updated": "2026-04-16", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.09, + "output": 0 }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3-0324", - "name": "siliconflow/deepseek-v3-0324", - "display_name": "siliconflow/deepseek-v3-0324", + "id": "anthropic-claude-4.6-sonnet", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, 
- "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.25, - "output": 1 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 + } }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3.2", - "name": "siliconflow/deepseek-v3.2", - "display_name": "siliconflow/deepseek-v3.2", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -40176,8 +40986,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -40191,30 +41001,32 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "open_weights": true, + "release_date": "2025-01-30", + "last_updated": "2025-01-30", "cost": { - "input": 0.27, - "output": 0.42 + "input": 0.99, + "output": 0.99 }, "type": "chat" }, { - "id": "siliconflow/deepseek-r1-0528", - "name": "siliconflow/deepseek-r1-0528", - "display_name": "siliconflow/deepseek-r1-0528", + "id": "anthropic-claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -40222,31 +41034,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.5, - "output": 2.18 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3.1-terminus", - "name": "siliconflow/deepseek-v3.1-terminus", - "display_name": "siliconflow/deepseek-v3.1-terminus", + "id": "multi-qa-mpnet-base-dot-v1", + "name": "Multi-QA-mpnet-base-dot-v1", + "display_name": "Multi-QA-mpnet-base-dot-v1", "modalities": { "input": [ "text" @@ -40256,29 +41060,28 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 512, + "output": 768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2021-08-30", + "last_updated": "2026-04-16", "cost": { - "input": 0.27, - "output": 1 + "input": 0.009, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "qwen-2.5-14b-instruct", + "name": "Qwen 2.5 14B Instruct", + "display_name": "Qwen 2.5 14B Instruct", "modalities": { "input": [ "text" @@ -40288,8 +41091,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -40298,19 +41101,15 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 1, - "output": 5 - }, + 
"knowledge": "2024-09", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "e5-large-v2", + "name": "E5 Large v2", + "display_name": "E5 Large v2", "modalities": { "input": [ "text" @@ -40320,53 +41119,41 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2023-05-19", + "last_updated": "2026-04-30", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.02, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "anthropic-claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -40374,60 +41161,60 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + 
"release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-09-23", - "name": "Qwen3 Coder Plus 2025 09 23", - "display_name": "Qwen3 Coder Plus 2025 09 23", + "id": "openai-gpt-image-1.5", + "name": "GPT Image 1.5", + "display_name": "GPT Image 1.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "cost": { + "input": 5, + "output": 10, + "cache_read": 1 + }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-07-22", - "name": "Qwen3 Coder Plus 2025 07 22", - "display_name": "Qwen3 Coder Plus 2025 07 22", + "id": "llama-4-maverick", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -40435,123 +41222,186 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2026-04-30", + "cost": { + "input": 0.25, + "output": 0.87 + }, "type": "chat" }, { - "id": "qwen-vl-ocr-latest", - "name": "Qwen Vl Ocr Latest", - "display_name": "Qwen Vl Ocr Latest", + "id": "openai-gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, 
"limit": { - "context": 34096, - "output": 4096 + "context": 1000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, - "attachment": false, "type": "chat" }, { - "id": "qvq-max-2025-05-15", - "name": "Qvq Max 2025 05 15", - "display_name": "Qvq Max 2025 05 15", + "id": "anthropic-claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 16384, - "min": 0, - "max": 16384 + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 } }, - "attachment": false, "type": "chat" }, { - "id": "qwen-turbo-latest", - "name": "Qwen Turbo Latest", - "display_name": "Qwen Turbo Latest", + "id": "openai-o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": 
true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "type": "chat" + }, + { + "id": "wan2-2-t2v-a14b", + "name": "Wan2.2-T2V-A14B", + "display_name": "Wan2.2-T2V-A14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "limit": { + "context": 100, + "output": 1 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2026-04-30", + "cost": { + "input": 0.6, + "output": 0 + }, "type": "chat" }, { - "id": "qwen-turbo-2024-09-19", - "name": "Qwen Turbo 2024 09 19", - "display_name": "Qwen Turbo 2024 09 19", + "id": "anthropic-claude-3.5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text" @@ -40561,7 +41411,7 @@ ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -40570,12 +41420,22 @@ "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-11-05", + "last_updated": "2024-11-05", + "cost": { + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + }, "type": "chat" }, { - "id": "qwen-flash-2025-07-28", - "name": "Qwen Flash 2025 07 28", - "display_name": "Qwen Flash 2025 07 28", + "id": "bge-m3", + "name": 
"BGE M3", + "display_name": "BGE M3", "modalities": { "input": [ "text" @@ -40585,115 +41445,129 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 8192, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-01-30", + "last_updated": "2026-04-30", + "cost": { + "input": 0.02, + "output": 0 }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "type": "embedding" + }, + { + "id": "mistral-3-14B", + "name": "Ministral 3 14B Instruct", + "display_name": "Ministral 3 14B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, + "open_weights": true, + "release_date": "2025-12-15", + "last_updated": "2026-04-30", + "cost": { + "input": 0.2, + "output": 0.2 + }, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "openai-gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": 
true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-plus-2024-09-19", - "name": "Qwen Plus 2024 09 19", - "display_name": "Qwen Plus 2024 09 19", + "id": "anthropic-claude-3-opus", + "name": "Claude 3 Opus", + "display_name": "Claude 3 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": false, + "knowledge": "2023-08", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, "type": "chat" }, { - "id": "qwen-plus-2025-07-14", - "name": "Qwen Plus 2025 07 14", - "display_name": "Qwen Plus 2025 07 14", + "id": "glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -40703,19 +41577,13 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 202752, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -40728,41 +41596,38 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": true, + "release_date": 
"2026-02-11", + "last_updated": "2026-04-16", + "cost": { + "input": 1, + "output": 3.2 + }, "type": "chat" }, { - "id": "qwen-plus-2025-09-11", - "name": "Qwen Plus 2025 09 11", - "display_name": "Qwen Plus 2025 09 11", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -40775,19 +41640,21 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.95, + "output": 4 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "openai-gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -40798,137 +41665,162 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-08-05", + "last_updated": "2026-04-16", + "cost": { + "input": 0.1, + "output": 0.7 + }, "type": 
"chat" }, { - "id": "qwen-max-2024-09-19", - "name": "Qwen Max 2024 09 19", - "display_name": "Qwen Max 2024 09 19", + "id": "fal-ai/fast-sdxl", + "name": "Fast SDXL", + "display_name": "Fast SDXL", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, + "context": 8192, "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": true, + "release_date": "2023-07-26", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "qwen-max-2024-04-28", - "name": "Qwen Max 2024 04 28", - "display_name": "Qwen Max 2024 04 28", + "id": "fal-ai/flux/schnell", + "name": "FLUX.1 [schnell]", + "display_name": "FLUX.1 [schnell]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "qwen-max-2024-04-03", - "name": "Qwen Max 2024 04 03", - "display_name": "Qwen Max 2024 04 03", - "modalities": { - "input": [ + "id": "fal-ai/elevenlabs/tts/multilingual-v2", + "name": "ElevenLabs Multilingual TTS v2", + "display_name": "ElevenLabs Multilingual TTS v2", + "modalities": { + "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2023-08-22", + "last_updated": 
"2026-04-16", "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen Max 2025 01 25", - "display_name": "Qwen Max 2025 01 25", + "id": "fal-ai/stable-audio-25/text-to-audio", + "name": "Stable Audio 2.5 (Text-to-Audio)", + "display_name": "Stable Audio 2.5 (Text-to-Audio)", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "release_date": "2025-10-08", + "last_updated": "2026-04-16", "type": "chat" - }, + } + ] + }, + "moonshot-ai": { + "id": "moonshot-ai", + "name": "Moonshot AI", + "display_name": "Moonshot AI", + "api": "https://api.moonshot.ai/v1", + "doc": "https://platform.moonshot.ai/docs/api/chat", + "models": [ { - "id": "qwen3-max-2025-09-23", - "name": "Qwen3 Max 20250923", - "display_name": "Qwen3 Max 20250923", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -40936,26 +41828,41 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", + "cost": { + "input": 0.6, + "output": 3, + 
"cache_read": 0.1 + }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -40966,37 +41873,29 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -41006,19 +41905,14 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -41032,36 +41926,21 @@ } }, "attachment": false, - "type": "chat" - }, - { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - 
"tool_call": true, - "reasoning": { - "supported": false + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ "text" @@ -41072,7 +41951,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -41080,12 +41959,21 @@ "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -41095,19 +41983,14 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -41121,34 +42004,40 @@ } }, "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 1.15, + "output": 8, + "cache_read": 0.15 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": 
"Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -41161,13 +42050,22 @@ ] } }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.95, + "output": 4, + "cache_read": 0.16 + }, "type": "chat" }, { - "id": "qwen3-4b", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ "text" @@ -41177,162 +42075,136 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 2.4, + "output": 10, + "cache_read": 0.6 + }, "type": "chat" - }, + } + ] + }, + "mistral": { + "id": "mistral", + "name": "Mistral", + "display_name": "Mistral", + "doc": "https://docs.mistral.ai/getting-started/models/", + "models": [ { - "id": "qwen3-1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "mistral-medium-2604", + "name": "Mistral Medium 3.5", + "display_name": "Mistral Medium 3.5", "modalities": { 
"input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "release_date": "2026-04-29", + "last_updated": "2026-04-29", + "cost": { + "input": 1.5, + "output": 7.5 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-vl-plus-2025-09-23", - "name": "Qwen3 VL Plus 2025 09 23", - "display_name": "Qwen3 VL Plus 2025 09 23", + "id": "ministral-3b-latest", + "name": "Ministral 3B (latest)", + "display_name": "Ministral 3B (latest)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
262144, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", + "cost": { + "input": 0.04, + "output": 0.04 + }, "type": "chat" }, { - "id": "qwq-plus-latest", - "name": "QwQ Plus Latest", - "display_name": "QwQ Plus Latest", + "id": "mistral-large-2411", + "name": "Mistral Large 2.1", + "display_name": "Mistral Large 2.1", "modalities": { "input": [ "text" @@ -41343,49 +42215,28 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", + "cost": { + "input": 2, + "output": 6 + }, "type": "chat" - } - ] - }, - "firepass": { - "id": "firepass", - "name": "Fireworks (Firepass)", - "display_name": "Fireworks (Firepass)", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://docs.fireworks.ai/firepass", - "models": [ + }, { - "id": "accounts/fireworks/routers/kimi-k2p6-turbo", - "name": "Kimi K2.6 Turbo", - "display_name": "Kimi K2.6 Turbo", + "id": "pixtral-12b", + 
"name": "Pixtral 12B", + "display_name": "Pixtral 12B", "modalities": { "input": [ "text", @@ -41396,50 +42247,29 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.15, + "output": 0.15 }, "type": "chat" - } - ] - }, - "minimax-cn-coding-plan": { - "id": "minimax-cn-coding-plan", - "name": "MiniMax Coding Plan (minimaxi.com)", - "display_name": "MiniMax Coding Plan (minimaxi.com)", - "api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/coding-plan/intro", - "models": [ + }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "codestral-latest", + "name": "Codestral (latest)", + "display_name": "Codestral (latest)", "modalities": { "input": [ "text" @@ -41449,34 +42279,29 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": 
"MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "open-mixtral-8x22b", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ "text" @@ -41486,47 +42311,41 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 64000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-04", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "mistral-small-latest", + "name": "Mistral Small (latest)", + "display_name": "Mistral Small (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -41534,44 +42353,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": 
"mistral-small-2603", + "name": "Mistral Small 4", + "display_name": "Mistral Small 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -41579,33 +42387,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -41615,34 +42411,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "open-mistral-7b", + "name": "Mistral 7B", + "display_name": "Mistral 7B", "modalities": { "input": [ "text" @@ -41652,83 +42443,62 @@ ] }, "limit": { - 
"context": 204800, - "output": 131072 + "context": 8000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "knowledge": "2023-12", + "release_date": "2023-09-27", + "last_updated": "2023-09-27", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.25, + "output": 0.25 }, "type": "chat" - } - ] - }, - "bailing": { - "id": "bailing", - "name": "Bailing", - "display_name": "Bailing", - "api": "https://api.tbox.cn/api/llm/v1/chat/completions", - "doc": "https://alipaytbox.yuque.com/sxs0ba/ling/intro", - "models": [ + }, { - "id": "Ring-1T", - "name": "Ring-1T", - "display_name": "Ring-1T", + "id": "mistral-medium-2508", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-10", - "last_updated": "2025-10", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.57, - "output": 2.29 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "Ling-1T", - "name": "Ling-1T", - "display_name": "Ling-1T", + "id": "devstral-medium-2507", + "name": "Devstral Medium", + "display_name": "Devstral Medium", "modalities": { "input": [ "text" @@ -41739,7 +42509,7 @@ }, "limit": { 
"context": 128000, - "output": 32000 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -41748,28 +42518,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-10", - "last_updated": "2025-10", + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.57, - "output": 2.29 + "input": 0.4, + "output": 2 }, "type": "chat" - } - ] - }, - "iflowcn": { - "id": "iflowcn", - "name": "iFlow", - "display_name": "iFlow", - "api": "https://apis.iflow.cn/v1", - "doc": "https://platform.iflow.cn/en/docs", - "models": [ + }, { - "id": "qwen3-coder-plus", - "name": "Qwen3-Coder-Plus", - "display_name": "Qwen3-Coder-Plus", + "id": "devstral-small-2505", + "name": "Devstral Small 2505", + "display_name": "Devstral Small 2505", "modalities": { "input": [ "text" @@ -41779,8 +42540,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -41789,19 +42550,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -41811,40 +42572,29 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, 
"open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "magistral-medium-latest", + "name": "Magistral Medium (latest)", + "display_name": "Magistral Medium (latest)", "modalities": { "input": [ "text" @@ -41855,7 +42605,7 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -41863,32 +42613,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 5 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3-Max", - "display_name": "Qwen3-Max", + "id": "magistral-small", + "name": "Magistral Small", + "display_name": "Magistral Small", "modalities": { "input": [ "text" @@ -41898,40 +42637,30 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + 
"open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct", - "name": "Qwen3-235B-A22B-Instruct", - "display_name": "Qwen3-235B-A22B-Instruct", + "id": "devstral-small-2507", + "name": "Devstral Small", + "display_name": "Devstral Small", "modalities": { "input": [ "text" @@ -41941,8 +42670,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -41951,63 +42680,52 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3-235B-A22B-Thinking", - "display_name": "Qwen3-235B-A22B-Thinking", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + 
"output": 2 }, "type": "chat" }, { - "id": "kimi-k2-0905", - "name": "Kimi-K2-0905", - "display_name": "Kimi-K2-0905", + "id": "devstral-medium-latest", + "name": "Devstral 2 (latest)", + "display_name": "Devstral 2 (latest)", "modalities": { "input": [ "text" @@ -42017,8 +42735,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -42026,58 +42744,53 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "mistral-small-2506", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2025-11-13", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3-VL-Plus", - "display_name": "Qwen3-VL-Plus", + "id": "mistral-large-latest", + "name": "Mistral Large (latest)", + "display_name": "Mistral Large (latest)", "modalities": { "input": [ "text", @@ -42088,67 +42801,52 @@ ] }, "limit": { - "context": 256000, - "output": 
32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2-Exp", - "display_name": "DeepSeek-V3.2-Exp", + "id": "labs-devstral-small-2512", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { "input": 0, "output": 0 @@ -42156,9 +42854,9 @@ "type": "chat" }, { - "id": "qwen3-235b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", "modalities": { "input": [ "text" @@ -42168,30 +42866,28 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 8000, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + 
"supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": false, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0, + "input": 0.1, "output": 0 }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi-K2", - "display_name": "Kimi-K2", + "id": "open-mixtral-8x7b", + "name": "Mixtral 8x7B", + "display_name": "Mixtral 8x7B", "modalities": { "input": [ "text" @@ -42201,8 +42897,8 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 32000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -42210,20 +42906,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2024-01", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0, - "output": 0 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3-Max-Preview", - "display_name": "Qwen3-Max-Preview", + "id": "ministral-8b-latest", + "name": "Ministral 8B (latest)", + "display_name": "Ministral 8B (latest)", "modalities": { "input": [ "text" @@ -42233,43 +42929,33 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0, - 
"output": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "pixtral-large-latest", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -42277,36 +42963,28 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 6 }, "type": "chat" - } - ] - }, - "v0": { - "id": "v0", - "name": "v0", - "display_name": "v0", - "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", - "models": [ + }, { - "id": "v0-1.5-lg", - "name": "v0-1.5-lg", - "display_name": "v0-1.5-lg", + "id": "mistral-medium-latest", + "name": "Mistral Medium (latest)", + "display_name": "Mistral Medium (latest)", "modalities": { "input": [ "text", @@ -42317,8 +42995,8 @@ ] }, "limit": { - "context": 512000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -42327,31 +43005,39 @@ "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "open_weights": true, + "release_date": "2026-04-29", + "last_updated": "2026-04-29", "cost": { - "input": 15, - "output": 75 + "input": 1.5, + "output": 7.5 }, "type": "chat" - }, + } + ] + }, + "kilo": { + "id": "kilo", + "name": "Kilo Gateway", + "display_name": "Kilo Gateway", + "api": "https://api.kilo.ai/api/gateway", + "doc": "https://kilo.ai", + "models": [ { - "id": "v0-1.0-md", - "name": "v0-1.0-md", - "display_name": "v0-1.0-md", 
+ "id": "prime-intellect/intellect-3", + "name": "Prime Intellect: INTELLECT-3", + "display_name": "Prime Intellect: INTELLECT-3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -42359,74 +43045,93 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-11-26", + "last_updated": "2026-02-04", "cost": { - "input": 3, - "output": 15 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "v0-1.5-md", - "name": "v0-1.5-md", - "display_name": "v0-1.5-md", + "id": "liquid/lfm-2-24b-a2b", + "name": "LiquidAI: LFM2-24B-A2B", + "display_name": "LiquidAI: LFM2-24B-A2B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15 + "input": 0.03, + "output": 0.12 }, "type": "chat" - } - ] - }, - "huggingface": { - "id": "huggingface", - "name": "Hugging Face", - "display_name": "Hugging Face", - "api": "https://router.huggingface.co/v1", - "doc": "https://huggingface.co/docs/inference-providers", - "models": [ + }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "undi95/remm-slerp-l2-13b", + "name": "ReMM SLERP 13B", + "display_name": "ReMM SLERP 13B", 
"modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 6144, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-07-22", + "last_updated": "2026-03-15", + "cost": { + "input": 0.45, + "output": 0.65 + }, + "type": "chat" + }, + { + "id": "inception/mercury-2", + "name": "Inception: Mercury 2", + "display_name": "Inception: Mercury 2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 50000 }, "temperature": true, "tool_call": true, @@ -42434,32 +43139,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next", - "name": "Qwen3-Coder-Next", - "display_name": "Qwen3-Coder-Next", + "id": "sao10k/l3.1-70b-hanami-x1", + "name": "Sao10K: Llama 3.1 70B Hanami x1", + "display_name": "Sao10K: Llama 3.1 70B Hanami x1", "modalities": { "input": [ "text" @@ -42469,29 +43163,28 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 16000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "release_date": 
"2025-01-08", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1.5 + "input": 3, + "output": 3 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen3-Next-80B-A3B-Instruct", + "id": "sao10k/l3.1-euryale-70b", + "name": "Sao10K: Llama 3.1 Euryale 70B v2.2", + "display_name": "Sao10K: Llama 3.1 Euryale 70B v2.2", "modalities": { "input": [ "text" @@ -42501,8 +43194,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -42511,19 +43204,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "release_date": "2024-08-28", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 1 + "input": 0.85, + "output": 0.85 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen 3 Embedding 8B", - "display_name": "Qwen 3 Embedding 8B", + "id": "sao10k/l3-lunaris-8b", + "name": "Sao10K: Llama 3 8B Lunaris", + "display_name": "Sao10K: Llama 3 8B Lunaris", "modalities": { "input": [ "text" @@ -42533,29 +43225,28 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2024-08-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.01, - "output": 0 + "input": 0.04, + "output": 0.05 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "sao10k/l3-euryale-70b", + "name": "Sao10k: Llama 3 Euryale 70B v2.1", + "display_name": "Sao10k: Llama 3 Euryale 
70B v2.1", "modalities": { "input": [ "text" @@ -42565,41 +43256,28 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "release_date": "2024-06-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 3 + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "sao10k/l3.3-euryale-70b", + "name": "Sao10K: Llama 3.3 Euryale 70B", + "display_name": "Sao10K: Llama 3.3 Euryale 70B", "modalities": { "input": [ "text" @@ -42609,40 +43287,28 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "release_date": "2024-12-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 2 + "input": 0.65, + "output": 0.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-4B", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", + "id": "ibm-granite/granite-4.0-h-micro", + "name": "IBM: Granite 4.0 Micro", + "display_name": 
"IBM: Granite 4.0 Micro", "modalities": { "input": [ "text" @@ -42652,29 +43318,28 @@ ] }, "limit": { - "context": 32000, - "output": 2048 + "context": 131000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-10-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.01, - "output": 0 + "input": 0.017, + "output": 0.11 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen3-Coder-480B-A35B-Instruct", + "id": "ibm-granite/granite-4.1-8b", + "name": "IBM: Granite 4.1 8B", + "display_name": "IBM: Granite 4.1 8B", "modalities": { "input": [ "text" @@ -42684,8 +43349,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -42693,20 +43358,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2026-04-30", + "last_updated": "2026-05-01", "cost": { - "input": 2, - "output": 2 + "input": 0.05, + "output": 0.1, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-Flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "cohere/command-r-08-2024", + "name": "Cohere: Command R (08-2024)", + "display_name": "Cohere: Command R (08-2024)", "modalities": { "input": [ "text" @@ -42716,41 +43381,28 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "cohere/command-r-plus-08-2024", + "name": "Cohere: Command R+ (08-2024)", + "display_name": "Cohere: Command R+ (08-2024)", "modalities": { "input": [ "text" @@ -42760,42 +43412,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "cohere/command-r7b-12-2024", + "name": "Cohere: Command R7B (12-2024)", + "display_name": "Cohere: Command R7B (12-2024)", "modalities": { "input": [ "text" @@ -42805,41 +43443,28 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - 
"visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-03", - "last_updated": "2026-04-03", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.0375, + "output": 0.15 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "cohere/command-a", + "name": "Cohere: Command A", + "display_name": "Cohere: Command A", "modalities": { "input": [ "text" @@ -42849,41 +43474,28 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 256000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "XiaomiMiMo/MiMo-V2-Flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "thedrummer/unslopnemo-12b", + "name": "TheDrummer: UnslopNemo 12B", + "display_name": "TheDrummer: UnslopNemo 12B", "modalities": { "input": [ "text" @@ -42893,30 +43505,28 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2024-11-09", + 
"last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "thedrummer/cydonia-24b-v4.1", + "name": "TheDrummer: Cydonia 24B V4.1", + "display_name": "TheDrummer: Cydonia 24B V4.1", "modalities": { "input": [ "text" @@ -42926,41 +43536,28 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-09-27", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 5 + "input": 0.3, + "output": 0.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "thedrummer/rocinante-12b", + "name": "TheDrummer: Rocinante 12B", + "display_name": "TheDrummer: Rocinante 12B", "modalities": { "input": [ "text" @@ -42970,35 +43567,28 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2024-09-30", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 0.4 + "input": 0.17, + "output": 0.43 }, "type": 
"chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi-K2-Thinking", - "display_name": "Kimi-K2-Thinking", + "id": "thedrummer/skyfall-36b-v2", + "name": "TheDrummer: Skyfall 36B V2", + "display_name": "TheDrummer: Skyfall 36B V2", "modalities": { "input": [ "text" @@ -43008,89 +43598,60 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2025-03-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.55, + "output": 0.8 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + "id": "bytedance/ui-tars-1.5-7b", + "name": "ByteDance: UI-TARS 7B ", + "display_name": "ByteDance: UI-TARS 7B ", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2026-03-15", "cost": { - 
"input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.1, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi-K2-Instruct", - "display_name": "Kimi-K2-Instruct", + "id": "alfredpros/codellama-7b-instruct-solidity", + "name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", + "display_name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", "modalities": { "input": [ "text" @@ -43100,29 +43661,28 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 3 + "input": 0.8, + "output": 1.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi-K2-Instruct-0905", - "display_name": "Kimi-K2-Instruct-0905", + "id": "deepcogito/cogito-v2.1-671b", + "name": "Deep Cogito: Cogito v2.1 671B", + "display_name": "Deep Cogito: Cogito v2.1 671B", "modalities": { "input": [ "text" @@ -43132,34 +43692,33 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", + "release_date": "2025-11-14", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 3 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "moonshotai/kimi-k2.5", + "name": "MoonshotAI: Kimi K2.5", + "display_name": "MoonshotAI: Kimi K2.5", "modalities": { "input": [ 
- "text", "image", - "video" + "text" ], "output": [ "text" @@ -43167,7 +43726,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65535 }, "temperature": true, "tool_call": true, @@ -43188,20 +43747,18 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2026-01-27", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.45, + "output": 2.2 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "moonshotai/kimi-k2-0905", + "name": "MoonshotAI: Kimi K2 0905", + "display_name": "MoonshotAI: Kimi K2 0905", "modalities": { "input": [ "text" @@ -43211,41 +43768,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.4, + "output": 2, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "moonshotai/kimi-k2-thinking", + "name": "MoonshotAI: Kimi K2 Thinking", + "display_name": "MoonshotAI: Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -43255,8 +43800,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -43277,19 +43822,19 @@ }, "attachment": false, 
"open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-11-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.47, + "output": 2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "moonshotai/kimi-k2", + "name": "MoonshotAI: Kimi K2 0711", + "display_name": "MoonshotAI: Kimi K2 0711", "modalities": { "input": [ "text" @@ -43299,52 +43844,40 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131000, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2025-07-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "moonshotai/kimi-k2.6", + "name": "MoonshotAI: Kimi K2.6", + "display_name": "MoonshotAI: Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -43354,40 +43887,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": 
"2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-04-20", + "last_updated": "2026-05-12", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.75, + "output": 3.5, + "cache_read": 0.375 }, "type": "chat" - } - ] - }, - "upstage": { - "id": "upstage", - "name": "Upstage", - "display_name": "Upstage", - "api": "https://api.upstage.ai/v1/solar", - "doc": "https://developers.upstage.ai/docs/apis/chat", - "models": [ + }, { - "id": "solar-pro2", - "name": "solar-pro2", - "display_name": "solar-pro2", + "id": "morph/morph-v3-large", + "name": "Morph: Morph V3 Large", + "display_name": "Morph: Morph V3 Large", "modalities": { "input": [ "text" @@ -43397,30 +43914,28 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 262144, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.25, - "output": 0.25 - }, + "input": 0.9, + "output": 1.9 + }, "type": "chat" }, { - "id": "solar-mini", - "name": "solar-mini", - "display_name": "solar-mini", + "id": "morph/morph-v3-fast", + "name": "Morph: Morph V3 Fast", + "display_name": "Morph: Morph V3 Fast", "modalities": { "input": [ "text" @@ -43430,40 +43945,41 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 81920, + "output": 38000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-06-12", - "last_updated": "2025-04-22", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.8, + "output": 
1.2 }, "type": "chat" }, { - "id": "solar-pro3", - "name": "solar-pro3", - "display_name": "solar-pro3", + "id": "bytedance-seed/seed-1.6-flash", + "name": "ByteDance Seed: Seed 1.6 Flash", + "display_name": "ByteDance Seed: Seed 1.6 Flash", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -43471,41 +43987,33 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2026-01", - "last_updated": "2026-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 0.25 + "input": 0.075, + "output": 0.3 }, "type": "chat" - } - ] - }, - "novita-ai": { - "id": "novita-ai", - "name": "NovitaAI", - "display_name": "NovitaAI", - "api": "https://api.novita.ai/openai", - "doc": "https://novita.ai/docs/guides/introduction", - "models": [ + }, { - "id": "deepseek/deepseek-r1-turbo", - "name": "DeepSeek R1 (Turbo)\t", - "display_name": "DeepSeek R1 (Turbo)\t", + "id": "bytedance-seed/seed-1.6", + "name": "ByteDance Seed: Seed 1.6", + "display_name": "ByteDance Seed: Seed 1.6", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -43513,153 +44021,160 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "attachment": true, + "open_weights": false, + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.7, - "output": 2.5 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek V3 0324", - 
"display_name": "DeepSeek V3 0324", + "id": "bytedance-seed/seed-2.0-mini", + "name": "ByteDance Seed: Seed-2.0-Mini", + "display_name": "ByteDance Seed: Seed-2.0-Mini", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2026-02-27", + "last_updated": "2026-03-15", "cost": { - "input": 0.27, - "output": 1.12, - "cache_read": 0.135 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek/deepseek-ocr-2", - "name": "deepseek/deepseek-ocr-2", - "display_name": "deepseek/deepseek-ocr-2", + "id": "bytedance-seed/seed-2.0-lite", + "name": "ByteDance Seed: Seed-2.0-Lite", + "display_name": "ByteDance Seed: Seed-2.0-Lite", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2026-03-10", + "last_updated": "2026-03-15", "cost": { - "input": 0.03, - "output": 0.03 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "deepseek/deepseek-ocr", - "name": "DeepSeek-OCR", - "display_name": "DeepSeek-OCR", + "id": "z-ai/glm-5.1", + "name": "Z.ai: GLM 5.1", + "display_name": "Z.ai: GLM 5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 202752, + 
"output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-10-24", - "last_updated": "2025-10-24", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.03, - "output": 0.03 + "input": 1.26, + "output": 3.96 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill LLama 70B", - "display_name": "DeepSeek R1 Distill LLama 70B", + "id": "z-ai/glm-5v-turbo", + "name": "Z.ai: GLM 5V Turbo", + "display_name": "Z.ai: GLM 5V Turbo", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2026-04-01", + "last_updated": "2026-04-11", "cost": { - "input": 0.8, - "output": 0.8 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "deepseek/deepseek-prover-v2-671b", - "name": "Deepseek Prover V2 671B", - "display_name": "Deepseek Prover V2 671B", + "id": "z-ai/glm-4.5-air", + "name": "Z.ai: GLM 4.5 Air", + "display_name": "Z.ai: GLM 4.5 Air", "modalities": { "input": [ "text" @@ -43669,60 +44184,64 @@ ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 131072, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": 
false, "open_weights": true, - "release_date": "2025-04-30", - "last_updated": "2025-04-30", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.7, - "output": 2.5 + "input": 0.13, + "output": 0.85, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528-qwen3-8b", - "name": "DeepSeek R1 0528 Qwen3 8B", - "display_name": "DeepSeek R1 0528 Qwen3 8B", + "id": "z-ai/glm-4.5v", + "name": "Z.ai: GLM 4.5V", + "display_name": "Z.ai: GLM 4.5V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 65536, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-05-29", - "last_updated": "2025-05-29", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0.06, - "output": 0.09 + "input": 0.6, + "output": 1.8, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-32b", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill Qwen 32B", + "id": "z-ai/glm-4.7-flash", + "name": "Z.ai: GLM 4.7 Flash", + "display_name": "Z.ai: GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -43732,29 +44251,35 @@ ] }, "limit": { - "context": 64000, - "output": 32000 + "context": 202752, + "output": 40551 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.06, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": 
"deepseek/deepseek-v3.2-exp", - "name": "Deepseek V3.2 Exp", - "display_name": "Deepseek V3.2 Exp", + "id": "z-ai/glm-4.6", + "name": "Z.ai: GLM 4.6", + "display_name": "Z.ai: GLM 4.6", "modalities": { "input": [ "text" @@ -43764,8 +44289,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 204800, + "output": 204800 }, "temperature": true, "tool_call": true, @@ -43773,20 +44298,26 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-09-30", + "last_updated": "2026-03-15", "cost": { - "input": 0.27, - "output": 0.41 + "input": 0.39, + "output": 1.9, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "z-ai/glm-4.5", + "name": "Z.ai: GLM 4.5", + "display_name": "Z.ai: GLM 4.5", "modalities": { "input": [ "text" @@ -43797,7 +44328,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 98304 }, "temperature": true, "tool_call": true, @@ -43807,19 +44338,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-07-28", + "last_updated": "2026-03-15", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 + "input": 0.6, + "output": 2.2, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "Deepseek V3.2", - "display_name": "Deepseek V3.2", + "id": "z-ai/glm-5-turbo", + "name": "Z.ai: GLM 5 Turbo", + "display_name": "Z.ai: GLM 5 Turbo", "modalities": { "input": [ "text" @@ -43829,8 +44360,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -43840,30 +44371,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-03-15", + "last_updated": "2026-04-11", "cost": { - "input": 0.269, - "output": 0.4, - "cache_read": 0.1345 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3-turbo", - "name": "DeepSeek V3 (Turbo)\t", - "display_name": "DeepSeek V3 (Turbo)\t", + "id": "z-ai/glm-4.7", + "name": "Z.ai: GLM 4.7", + "display_name": "Z.ai: GLM 4.7", "modalities": { "input": [ "text" @@ -43873,28 +44398,41 @@ ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "release_date": "2025-12-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 1.3 + "input": 0.38, + "output": 1.98, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-14b", - "name": "DeepSeek R1 Distill Qwen 14B", - "display_name": "DeepSeek R1 Distill Qwen 14B", + "id": "z-ai/glm-4-32b", + "name": "Z.ai: GLM 4 32B ", + "display_name": "Z.ai: GLM 4 32B ", "modalities": { "input": [ "text" @@ -43904,29 +44442,28 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - 
"release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-07-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "z-ai/glm-5", + "name": "Z.ai: GLM 5", + "display_name": "Z.ai: GLM 5", "modalities": { "input": [ "text" @@ -43936,8 +44473,8 @@ ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -43958,23 +44495,23 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2026-02-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.7, - "output": 2.5, - "cache_read": 0.35 + "input": 0.72, + "output": 2.3 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "Deepseek V3.1 Terminus", - "display_name": "Deepseek V3.1 Terminus", + "id": "z-ai/glm-4.6v", + "name": "Z.ai: GLM 4.6V", + "display_name": "Z.ai: GLM 4.6V", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" @@ -43982,7 +44519,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -43990,23 +44527,24 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "release_date": "2025-09-30", + "last_updated": "2026-01-10", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "inclusionai/ling-2.6-1t", - "name": "Ling-2.6-1T", - "display_name": "Ling-2.6-1T", + "id": "openai/gpt-4o", + "name": "OpenAI: GPT-4o", + "display_name": "OpenAI: GPT-4o", "modalities": { "input": [ + "image", + "pdf", 
"text" ], "output": [ @@ -44014,62 +44552,64 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": true, + "open_weights": false, + "release_date": "2024-05-13", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "paddlepaddle/paddleocr-vl", - "name": "PaddleOCR-VL", - "display_name": "PaddleOCR-VL", + "id": "openai/gpt-4o-mini-search-preview", + "name": "OpenAI: GPT-4o-mini Search Preview", + "display_name": "OpenAI: GPT-4o-mini Search Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 128000, "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", + "attachment": false, + "open_weights": false, + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "nousresearch/hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "openai/gpt-5.2", + "name": "OpenAI: GPT-5.2", + "display_name": "OpenAI: GPT-5.2", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44077,28 +44617,52 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": 
true, - "release_date": "2024-06-27", - "last_updated": "2024-06-27", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0.14 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "openai/gpt-3.5-turbo", + "name": "OpenAI: GPT-3.5 Turbo", + "display_name": "OpenAI: GPT-3.5 Turbo", "modalities": { "input": [ "text" @@ -44108,43 +44672,32 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16385, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "openai/o3-pro", + "name": "OpenAI: o3 Pro", + "display_name": "OpenAI: o3 Pro", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44152,10 +44705,10 @@ ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, 
"tool_call": true, "reasoning": { "supported": true, @@ -44164,29 +44717,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-16", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "zai-org/glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "openai/gpt-3.5-turbo-16k", + "name": "OpenAI: GPT-3.5 Turbo 16k", + "display_name": "OpenAI: GPT-3.5 Turbo 16k", "modalities": { "input": [ "text" @@ -44196,43 +44751,32 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16385, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2023-08-28", + "last_updated": "2026-03-15", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "zai-org/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "openai/gpt-5.4-nano", + "name": "OpenAI: GPT-5.4 Nano", + "display_name": "OpenAI: GPT-5.4 Nano", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44240,52 +44784,66 @@ ] 
}, "limit": { - "context": 131072, - "output": 98304 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "zai-org/glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "openai/gpt-5-image-mini", + "name": "OpenAI: GPT-5 Image Mini", + "display_name": "OpenAI: GPT-5 Image Mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -44293,59 +44851,62 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-10-13", - "last_updated": "2025-10-13", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-16", + "last_updated": "2026-03-15", "cost": { - "input": 0.13, - "output": 0.85 + "input": 2.5, + "output": 2 }, "type": "chat" }, { - "id": "zai-org/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "openai/gpt-5.5-pro", + "name": 
"OpenAI: GPT-5.5 Pro", + "display_name": "OpenAI: GPT-5.5 Pro", "modalities": { "input": [ "text", - "video", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { - "input": 0.6, - "output": 1.8, - "cache_read": 0.11 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "zai-org/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "openai/gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1-Codex-Mini", + "display_name": "OpenAI: GPT-5.1-Codex-Mini", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -44353,79 +44914,109 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.55, - 
"output": 2.2, - "cache_read": 0.11 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "zai-org/glm-4.6v", - "name": "GLM 4.6V", - "display_name": "GLM 4.6V", + "id": "openai/gpt-5.2-pro", + "name": "OpenAI: GPT-5.2 Pro", + "display_name": "OpenAI: GPT-5.2 Pro", "modalities": { "input": [ - "text", - "video", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.055 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "openai/gpt-4o-2024-05-13", + "name": "OpenAI: GPT-4o (2024-05-13)", + "display_name": "OpenAI: GPT-4o (2024-05-13)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44433,99 +45024,117 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - 
"last_updated": "2026-01-19", + "attachment": true, + "open_weights": false, + "release_date": "2024-05-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "zai-org/autoglm-phone-9b-multilingual", - "name": "AutoGLM-Phone-9B-Multilingual", - "display_name": "AutoGLM-Phone-9B-Multilingual", + "id": "openai/gpt-4-0314", + "name": "OpenAI: GPT-4 (older v0314)", + "display_name": "OpenAI: GPT-4 (older v0314)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 8191, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-10", - "last_updated": "2025-12-10", + "attachment": false, + "open_weights": false, + "release_date": "2023-05-28", + "last_updated": "2026-03-15", "cost": { - "input": 0.035, - "output": 0.138 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "openai/gpt-5.4-image-2", + "name": "OpenAI: GPT-5.4 Image 2", + "display_name": "OpenAI: GPT-5.4 Image 2", "modalities": { "input": [ - "text" + "image", + "text", + "pdf" ], "output": [ + "image", "text" ] }, "limit": { - "context": 60288, - "output": 16000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-30", - "last_updated": "2024-07-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": 
"medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 0.04, - "output": 0.17 + "input": 8, + "output": 15, + "cache_read": 2 }, "type": "chat" }, { - "id": "baichuan/baichuan-m2-32b", - "name": "baichuan-m2-32b", - "display_name": "baichuan-m2-32b", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "OpenAI: GPT-3.5 Turbo Instruct", + "display_name": "OpenAI: GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -44535,8 +45144,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 4095, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -44544,21 +45153,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "open_weights": false, + "release_date": "2023-03-01", + "last_updated": "2023-09-21", "cost": { - "input": 0.07, - "output": 0.07 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout Instruct", - "display_name": "Llama 4 Scout Instruct", - "modalities": { + "id": "openai/gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", + "modalities": { "input": [ "text", "image" @@ -44568,30 +45176,55 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + 
"medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-06", - "last_updated": "2025-04-06", + "open_weights": false, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.18, - "output": 0.59 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "openai/gpt-5.1-chat", + "name": "OpenAI: GPT-5.1 Chat", + "display_name": "OpenAI: GPT-5.1 Chat", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44599,31 +45232,33 @@ ] }, "limit": { - "context": 131072, - "output": 120000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-07", - "last_updated": "2024-12-07", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.135, - "output": 0.4 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "openai/gpt-4.1", + "name": "OpenAI: GPT-4.1", + "display_name": "OpenAI: GPT-4.1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44631,39 +45266,42 @@ ] }, "limit": { - "context": 32768, - "output": 32000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": 
"2026-03-15", "cost": { - "input": 0.03, - "output": 0.05 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "meta-llama/llama-3-8b-instruct", - "name": "Llama 3 8B Instruct", - "display_name": "Llama 3 8B Instruct", + "id": "openai/gpt-audio", + "name": "OpenAI: GPT Audio", + "display_name": "OpenAI: GPT Audio", "modalities": { "input": [ + "audio", "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": false, @@ -44671,19 +45309,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "open_weights": false, + "release_date": "2026-01-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.04, - "output": 0.04 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "openai/gpt-4o-search-preview", + "name": "OpenAI: GPT-4o Search Preview", + "display_name": "OpenAI: GPT-4o Search Preview", "modalities": { "input": [ "text" @@ -44693,28 +45331,27 @@ ] }, "limit": { - "context": 16384, + "context": 128000, "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2024-07-24", + "open_weights": false, + "release_date": "2025-03-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.02, - "output": 0.05 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "meta-llama/llama-3-70b-instruct", - "name": "Llama3 70B Instruct", - "display_name": "Llama3 70B Instruct", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: gpt-oss-20b", + "display_name": "OpenAI: gpt-oss-20b", "modalities": { "input": [ "text" @@ -44724,62 +45361,71 @@ ] }, "limit": { - "context": 8192, - "output": 
8000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.51, - "output": 0.74 + "input": 0.03, + "output": 0.14 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick Instruct", - "display_name": "Llama 4 Maverick Instruct", + "id": "openai/gpt-oss-safeguard-20b", + "name": "OpenAI: gpt-oss-safeguard-20b", + "display_name": "OpenAI: gpt-oss-safeguard-20b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-04-06", - "last_updated": "2025-04-06", + "attachment": false, + "open_weights": false, + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 0.27, - "output": 0.85 + "input": 0.075, + "output": 0.3, + "cache_read": 0.037 }, "type": "chat" }, { - "id": "gryphe/mythomax-l2-13b", - "name": "Mythomax L2 13B", - "display_name": "Mythomax L2 13B", + "id": "openai/gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44787,30 +45433,48 @@ ] }, "limit": { - "context": 4096, - "output": 3200 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + 
"supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.09, - "output": 0.09 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "sao10k/l31-70b-euryale-v2.2", - "name": "L31 70B Euryale V2.2", - "display_name": "L31 70B Euryale V2.2", + "id": "openai/gpt-4.1-mini", + "name": "OpenAI: GPT-4.1 Mini", + "display_name": "OpenAI: GPT-4.1 Mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44818,28 +45482,29 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 1.48, - "output": 1.48 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "sao10k/l3-70b-euryale-v2.1", - "name": "L3 70B Euryale V2.1\t", - "display_name": "L3 70B Euryale V2.1\t", + "id": "openai/gpt-4-turbo-preview", + "name": "OpenAI: GPT-4 Turbo Preview", + "display_name": "OpenAI: GPT-4 Turbo Preview", "modalities": { "input": [ "text" @@ -44849,8 +45514,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -44858,30 +45523,32 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-06-18", 
- "last_updated": "2024-06-18", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2026-03-15", "cost": { - "input": 1.48, - "output": 1.48 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "sao10k/L3-8B-Stheno-v3.2", - "name": "L3 8B Stheno V3.2", - "display_name": "L3 8B Stheno V3.2", + "id": "openai/gpt-4o-audio-preview", + "name": "OpenAI: GPT-4o Audio", + "display_name": "OpenAI: GPT-4o Audio", "modalities": { "input": [ + "audio", "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 8192, - "output": 32000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -44889,52 +45556,58 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-29", - "last_updated": "2024-11-29", + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.05 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "sao10k/l3-8b-lunaris", - "name": "Sao10k L3 8B Lunaris\t", - "display_name": "Sao10k L3 8B Lunaris\t", + "id": "openai/gpt-5-image", + "name": "OpenAI: GPT-5 Image", + "display_name": "OpenAI: GPT-5 Image", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-28", - "last_updated": "2024-11-28", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-14", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.05 + "input": 10, + "output": 10 }, "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "Wizardlm 2 8x22B", - "display_name": "Wizardlm 2 8x22B", + "id": "openai/gpt-5.1", + "name": 
"OpenAI: GPT-5.1", + "display_name": "OpenAI: GPT-5.1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44942,104 +45615,162 @@ ] }, "limit": { - "context": 65535, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-24", - "last_updated": "2024-04-24", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.62, - "output": 0.62 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: GPT OSS 20B", - "display_name": "OpenAI: GPT OSS 20B", + "id": "openai/gpt-5-nano", + "name": "OpenAI: GPT-5 Nano", + "display_name": "OpenAI: GPT-5 Nano", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": 
true, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.04, - "output": 0.15 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "openai/gpt-5.4", + "name": "OpenAI: GPT-5.4", + "display_name": "OpenAI: GPT-5.4", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1050000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": false, + "release_date": "2026-03-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.25 + "input": 2.5, + "output": 15 }, "type": "chat" }, { - "id": "minimaxai/minimax-m1-80k", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "openai/gpt-4-1106-preview", + "name": "OpenAI: GPT-4 Turbo (older v1106)", + "display_name": "OpenAI: GPT-4 Turbo (older v1106)", "modalities": { "input": [ "text" @@ -45049,31 +45780,32 @@ ] }, "limit": { - "context": 1000000, - "output": 40000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": 
"2025-06-17", - "last_updated": "2025-06-17", + "open_weights": false, + "release_date": "2023-11-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.55, - "output": 2.2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "xiaomimimo/mimo-v2-flash", - "name": "XiaomiMiMo/MiMo-V2-Flash", - "display_name": "XiaomiMiMo/MiMo-V2-Flash", + "id": "openai/gpt-4o-mini", + "name": "OpenAI: GPT-4o-mini", + "display_name": "OpenAI: GPT-4o-mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45081,65 +45813,77 @@ ] }, "limit": { - "context": 262144, - "output": 32000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "attachment": true, + "open_weights": false, + "release_date": "2024-07-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.3 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b-thinking", - "name": "ERNIE-4.5-VL-28B-A3B-Thinking", - "display_name": "ERNIE-4.5-VL-28B-A3B-Thinking", + "id": "openai/o1-pro", + "name": "OpenAI: o1-pro", + "display_name": "OpenAI: o1-pro", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - 
"release_date": "2025-11-26", - "last_updated": "2025-11-26", + "open_weights": false, + "release_date": "2025-03-19", + "last_updated": "2026-03-15", "cost": { - "input": 0.39, - "output": 0.39 + "input": 150, + "output": 600 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "ERNIE 4.5 VL 424B A47B", - "display_name": "ERNIE 4.5 VL 424B A47B", + "id": "openai/gpt-4-turbo", + "name": "OpenAI: GPT-4 Turbo", + "display_name": "OpenAI: GPT-4 Turbo", "modalities": { "input": [ "text", @@ -45150,31 +45894,32 @@ ] }, "limit": { - "context": 123000, - "output": 16000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "open_weights": false, + "release_date": "2023-09-13", + "last_updated": "2024-04-09", "cost": { - "input": 0.42, - "output": 1.25 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21B-a3b", - "name": "ERNIE 4.5 21B A3B", - "display_name": "ERNIE 4.5 21B A3B", + "id": "openai/gpt-5.4-mini", + "name": "OpenAI: GPT-5.4 Mini", + "display_name": "OpenAI: GPT-5.4 Mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45182,31 +45927,56 @@ ] }, "limit": { - "context": 120000, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + 
"verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-300b-a47b-paddle", - "name": "ERNIE 4.5 300B A47B", - "display_name": "ERNIE 4.5 300B A47B", + "id": "openai/o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45214,28 +45984,44 @@ ] }, "limit": { - "context": 123000, - "output": 12000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 1.1 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21B-a3b-thinking", - "name": "ERNIE-4.5-21B-A3B-Thinking", - "display_name": "ERNIE-4.5-21B-A3B-Thinking", + "id": "openai/gpt-3.5-turbo-0613", + "name": "OpenAI: GPT-3.5 Turbo (older v0613)", + "display_name": "OpenAI: GPT-3.5 Turbo (older v0613)", "modalities": { "input": [ "text" @@ -45245,120 +46031,146 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 4095, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + 
"supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": false, + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 0.07, - "output": 0.28 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "ERNIE 4.5 VL 28B A3B", - "display_name": "ERNIE 4.5 VL 28B A3B", + "id": "openai/o3-mini-high", + "name": "OpenAI: o3 Mini High", + "display_name": "OpenAI: o3 Mini High", "modalities": { "input": [ - "text", - "image" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 30000, - "output": 8000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "open_weights": false, + "release_date": "2025-01-31", + "last_updated": "2026-03-15", "cost": { - "input": 1.4, - "output": 5.6 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "openai/gpt-5.1-codex-max", + "name": "OpenAI: GPT-5.1-Codex-Max", + "display_name": "OpenAI: GPT-5.1-Codex-Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "openai/gpt-5.5", + "name": "OpenAI: GPT-5.5", + "display_name": "OpenAI: GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -45367,31 +46179,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, 
{ - "id": "minimax/minimax-m2.1", - "name": "Minimax M2.1", - "display_name": "Minimax M2.1", + "id": "openai/gpt-5.4-pro", + "name": "OpenAI: GPT-5.4 Pro", + "display_name": "OpenAI: GPT-5.4 Pro", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45399,42 +46223,52 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "openai/o4-mini-high", + "name": "OpenAI: o4 Mini High", + "display_name": "OpenAI: o4 Mini High", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45442,10 +46276,9 @@ ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 200000, + "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -45454,31 +46287,35 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": 
"medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-04-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "MiniMax M2.5 Highspeed", - "display_name": "MiniMax M2.5 Highspeed", + "id": "openai/o4-mini-deep-research", + "name": "OpenAI: o4 Mini Deep Research", + "display_name": "OpenAI: o4 Mini Deep Research", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45486,8 +46323,8 @@ ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 200000, + "output": 100000 }, "temperature": true, "tool_call": true, @@ -45498,31 +46335,36 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2024-06-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.03 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen2.5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "openai/gpt-4.1-nano", + "name": "OpenAI: GPT-4.1 Nano", + "display_name": "OpenAI: GPT-4.1 Nano", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45530,88 +46372,75 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1047576, + "output": 32768 }, 
"temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.07 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5-122B-A10B", - "display_name": "Qwen3.5-122B-A10B", + "id": "openai/gpt-4", + "name": "OpenAI: GPT-4", + "display_name": "OpenAI: GPT-4", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8191, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "attachment": false, + "open_weights": false, + "release_date": "2023-03-14", + "last_updated": "2024-04-09", "cost": { - "input": 0.4, - "output": 3.2 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "qwen/qwen3.6-27b", - "name": "Qwen3.6-27B", - "display_name": "Qwen3.6-27B", + "id": "openai/o4-mini", + "name": "OpenAI: o4 Mini", + "display_name": "OpenAI: o4 Mini", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -45620,76 +46449,91 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - 
"summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-04-16", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3.6 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "qwen/qwen3.5-27b", - "name": "Qwen3.5-27B", - "display_name": "Qwen3.5-27B", + "id": "openai/gpt-5.1-codex", + "name": "OpenAI: GPT-5.1-Codex", + "display_name": "OpenAI: GPT-5.1-Codex", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 2.4 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": 
"openai/gpt-4o-2024-11-20", + "name": "OpenAI: GPT-4o (2024-11-20)", + "display_name": "OpenAI: GPT-4o (2024-11-20)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45697,7 +46541,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, @@ -45705,153 +46549,159 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "attachment": true, + "open_weights": false, + "release_date": "2024-11-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.09, - "output": 0.58 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3-omni-30b-a3b-instruct", - "name": "Qwen3 Omni 30B A3B Instruct", - "display_name": "Qwen3 Omni 30B A3B Instruct", + "id": "openai/gpt-5.2-codex", + "name": "OpenAI: GPT-5.2-Codex", + "display_name": "OpenAI: GPT-5.2-Codex", "modalities": { "input": [ "text", - "video", - "audio", "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.25, - "output": 0.97, - "input_audio": 2.2, - "output_audio": 1.788 + "input": 1.75, + "output": 
14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "openai/gpt-5-chat", + "name": "OpenAI: GPT-5 Chat", + "display_name": "OpenAI: GPT-5 Chat", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3.6 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B Instruct", - "display_name": "Qwen2.5 VL 72B Instruct", + "id": "openai/gpt-4o-mini-2024-07-18", + "name": "OpenAI: GPT-4o-mini (2024-07-18)", + "display_name": "OpenAI: GPT-4o-mini (2024-07-18)", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "open_weights": false, + "release_date": "2024-07-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.8, - "output": 0.8 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": 
"qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "openai/gpt-5-mini", + "name": "OpenAI: GPT-5 Mini", + "display_name": "OpenAI: GPT-5 Mini", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -45859,88 +46709,100 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.98, - "output": 3.95 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "qwen/qwen3-vl-30b-a3b-thinking", - "display_name": "qwen/qwen3-vl-30b-a3b-thinking", + "id": "openai/o3-mini", + "name": "OpenAI: o3 Mini", + "display_name": "OpenAI: o3 Mini", "modalities": { "input": [ - "text", - "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": 
true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-11", - "last_updated": "2025-10-11", + "open_weights": false, + "release_date": "2024-12-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "qwen/qwen3-omni-30b-a3b-thinking", - "name": "Qwen3 Omni 30B A3B Thinking", - "display_name": "Qwen3 Omni 30B A3B Thinking", + "id": "openai/gpt-5.3-codex", + "name": "OpenAI: GPT-5.3-Codex", + "display_name": "OpenAI: GPT-5.3-Codex", "modalities": { "input": [ - "text", - "audio", - "video", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -45949,65 +46811,76 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "release_date": "2026-02-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 0.97, - "input_audio": 2.2, - "output_audio": 1.788 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-instruct", - "name": "qwen/qwen3-vl-8b-instruct", - "display_name": "qwen/qwen3-vl-8b-instruct", + "id": 
"openai/gpt-5.2-chat", + "name": "OpenAI: GPT-5.2 Chat", + "display_name": "OpenAI: GPT-5.2 Chat", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-17", - "last_updated": "2025-10-17", + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.08, - "output": 0.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "openai/gpt-4o-2024-08-06", + "name": "OpenAI: GPT-4o (2024-08-06)", + "display_name": "OpenAI: GPT-4o (2024-08-06)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46015,42 +46888,33 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "release_date": "2024-08-06", + "last_updated": "2026-03-15", "cost": { - "input": 2.11, - "output": 8.45 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3-32b-fp8", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "openai/gpt-chat-latest", + "name": "OpenAI: GPT Chat Latest", + "display_name": "OpenAI: GPT Chat Latest", "modalities": { "input": [ + "image", + "pdf", "text" ], 
"output": [ @@ -46058,29 +46922,35 @@ ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-05", + "last_updated": "2026-05-07", "cost": { - "input": 0.1, - "output": 0.45 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen3-4b-fp8", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "openai/gpt-oss-120b", + "name": "OpenAI: gpt-oss-120b", + "display_name": "OpenAI: gpt-oss-120b", "modalities": { "input": [ "text" @@ -46090,75 +46960,71 @@ ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.03, - "output": 0.03 + "input": 0.039, + "output": 0.19 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22b Thinking 2507", - "display_name": "Qwen3 235B A22b Thinking 2507", + "id": "openai/gpt-audio-mini", + "name": "OpenAI: GPT Audio Mini", + "display_name": "OpenAI: GPT Audio Mini", "modalities": { "input": [ + "audio", "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": 
{ - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": false, + "release_date": "2026-01-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 3 + "input": 0.6, + "output": 2.4 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "openai/o3", + "name": "OpenAI: o3", + "display_name": "OpenAI: o3", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46166,10 +47032,10 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -46178,30 +47044,36 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-16", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 1.5 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen-mt-plus", - "name": "Qwen MT Plus", - "display_name": "Qwen MT Plus", + "id": "openai/o3-deep-research", + "name": "OpenAI: o3 Deep Research", + "display_name": "OpenAI: o3 Deep Research", "modalities": { 
"input": [ + "image", + "pdf", "text" ], "output": [ @@ -46209,30 +47081,48 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-03", - "last_updated": "2025-09-03", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-06-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 0.75 + "input": 10, + "output": 40, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "openai/gpt-5.3-chat", + "name": "OpenAI: GPT-5.3 Chat", + "display_name": "OpenAI: GPT-5.3 Chat", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46240,30 +47130,31 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 1.5 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-fp8", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "openai/gpt-5", + "name": "OpenAI: GPT-5", + "display_name": "OpenAI: GPT-5", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46271,29 +47162,51 @@ ] }, 
"limit": { - "context": 40960, - "output": 20000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.09, - "output": 0.45 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "relace/relace-apply-3", + "name": "Relace: Relace Apply 3", + "display_name": "Relace: Relace Apply 3", "modalities": { "input": [ "text" @@ -46303,28 +47216,27 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "open_weights": false, + "release_date": "2025-09-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.85, + "output": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "relace/relace-search", + "name": "Relace: Relace Search", + "display_name": "Relace: Relace Search", "modalities": { "input": [ "text" @@ -46334,8 +47246,8 @@ ] }, "limit": { 
- "context": 262144, - "output": 65536 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -46343,25 +47255,22 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2025-12-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.3 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "qwen/qwen3-vl-30b-a3b-instruct", - "display_name": "qwen/qwen3-vl-30b-a3b-instruct", + "id": "aion-labs/aion-1.0", + "name": "AionLabs: Aion-1.0", + "display_name": "AionLabs: Aion-1.0", "modalities": { "input": [ - "text", - "video", - "image" + "text" ], "output": [ "text" @@ -46372,24 +47281,25 @@ "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-11", - "last_updated": "2025-10-11", + "attachment": false, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 0.7 + "input": 4, + "output": 8 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30b A3B Instruct", - "display_name": "Qwen3 Coder 30b A3B Instruct", + "id": "aion-labs/aion-rp-llama-3.1-8b", + "name": "AionLabs: Aion-RP 1.0 (8B)", + "display_name": "AionLabs: Aion-RP 1.0 (8B)", "modalities": { "input": [ "text" @@ -46399,28 +47309,28 @@ ] }, "limit": { - "context": 160000, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-09", - "last_updated": "2025-10-09", + "open_weights": false, + "release_date": "2025-02-05", + 
"last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.27 + "input": 0.8, + "output": 1.6 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-fp8", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "aion-labs/aion-2.0", + "name": "AionLabs: Aion-2.0", + "display_name": "AionLabs: Aion-2.0", "modalities": { "input": [ "text" @@ -46430,8 +47340,8 @@ ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -46440,19 +47350,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + "release_date": "2026-02-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.8, + "output": 1.6 }, "type": "chat" }, { - "id": "qwen/qwen3-8b-fp8", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "aion-labs/aion-1.0-mini", + "name": "AionLabs: Aion-1.0-Mini", + "display_name": "AionLabs: Aion-1.0-Mini", "modalities": { "input": [ "text" @@ -46462,8 +47372,8 @@ ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -46472,54 +47382,53 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.035, - "output": 0.138 + "input": 0.7, + "output": 1.4 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "openrouter/pareto-code", + "name": "Pareto Code Router", + "display_name": "Pareto Code Router", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + 
"context": 200000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen 2.5 72B Instruct", - "display_name": "Qwen 2.5 72B Instruct", + "id": "openrouter/free", + "name": "Free Models Router", + "display_name": "Free Models Router", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -46527,42 +47436,40 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-10-15", - "last_updated": "2024-10-15", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.38, - "output": 0.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen3.5-35B-A3B", - "display_name": "Qwen3.5-35B-A3B", + "id": "openrouter/owl-alpha", + "name": "Owl Alpha", + "display_name": "Owl Alpha", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1048756, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -46570,31 +47477,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - 
}, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-28", + "last_updated": "2026-04-30", "cost": { - "input": 0.25, - "output": 2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro", - "name": "Kat Coder Pro", - "display_name": "Kat Coder Pro", + "id": "openrouter/bodybuilder", + "name": "Body Builder (beta)", + "display_name": "Body Builder (beta)", "modalities": { "input": [ "text" @@ -46604,41 +47500,43 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-05", - "last_updated": "2026-01-05", + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "openrouter/auto", + "name": "Auto Router", + "display_name": "Auto Router", "modalities": { "input": [ + "audio", + "image", + "pdf", "text", - "image" + "video" ], "output": [ + "image", "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 2000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -46647,23 +47545,22 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Gemma 3 12B", - "display_name": "Gemma 3 12B", + "id": "switchpoint/router", + "name": 
"Switchpoint Router", + "display_name": "Switchpoint Router", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -46671,28 +47568,59 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-12", + "last_updated": "2026-03-15", + "cost": { + "input": 0.85, + "output": 3.4 + }, + "type": "chat" + }, + { + "id": "mancer/weaver", + "name": "Mancer: Weaver (alpha)", + "display_name": "Mancer: Weaver (alpha)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "attachment": false, + "open_weights": false, + "release_date": "2023-08-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.1 + "input": 0.75, + "output": 1 }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "amazon/nova-pro-v1", + "name": "Amazon: Nova Pro 1.0", + "display_name": "Amazon: Nova Pro 1.0", "modalities": { "input": [ "text", @@ -46703,40 +47631,42 @@ ] }, "limit": { - "context": 98304, - "output": 16384 + "context": 300000, + "output": 5120 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.119, - "output": 0.2 + "input": 0.8, + "output": 3.2 }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B 
A4B", - "display_name": "Gemma 4 26B A4B", + "id": "amazon/nova-2-lite-v1", + "name": "Amazon: Nova 2 Lite", + "display_name": "Amazon: Nova 2 Lite", "modalities": { "input": [ + "image", + "pdf", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1000000, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -46745,66 +47675,83 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.13, - "output": 0.4 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "amazon/nova-lite-v1", + "name": "Amazon: Nova Lite 1.0", + "display_name": "Amazon: Nova Lite 1.0", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 300000, + "output": 5120 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.06, + "output": 0.24 + }, + "type": "chat" + }, + { + "id": "amazon/nova-premier-v1", + "name": "Amazon: Nova Premier 1.0", + "display_name": "Amazon: Nova Premier 1.0", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": true, - "open_weights": true, - 
"knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "release_date": "2025-11-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 2.5, + "output": 12.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "amazon/nova-micro-v1", + "name": "Amazon: Nova Micro 1.0", + "display_name": "Amazon: Nova Micro 1.0", "modalities": { "input": [ "text" @@ -46814,8 +47761,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 5120 }, "temperature": true, "tool_call": true, @@ -46823,19 +47770,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.57, - "output": 2.3 + "input": 0.035, + "output": 0.14 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "writer/palmyra-x5", + "name": "Writer: Palmyra X5", + "display_name": "Writer: Palmyra X5", "modalities": { "input": [ "text" @@ -46845,76 +47792,59 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1040000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { "input": 0.6, - "output": 2.5 + "output": 6 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "inflection/inflection-3-productivity", + "name": "Inflection: Inflection 3 Productivity", + 
"display_name": "Inflection: Inflection 3 Productivity", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8000, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "inflection/inflection-3-pi", + "name": "Inflection: Inflection 3 Pi", + "display_name": "Inflection: Inflection 3 Pi", "modalities": { "input": [ "text" @@ -46924,40 +47854,28 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8000, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.5 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": 
"DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "minimax/minimax-m2.1", + "name": "MiniMax: MiniMax M2.1", + "display_name": "MiniMax: MiniMax M2.1", "modalities": { "input": [ "text" @@ -46967,8 +47885,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 196608, + "output": 39322 }, "temperature": true, "tool_call": true, @@ -46978,31 +47896,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.27, + "output": 0.95, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "minimax/minimax-m2", + "name": "MiniMax: MiniMax M2", + "display_name": "MiniMax: MiniMax M2", "modalities": { "input": [ "text" @@ -47012,8 +47923,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -47023,70 +47934,56 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-10-23", + "last_updated": "2026-03-15", "cost": { - "input": 1.69, - "output": 3.38, - "cache_read": 0.13 + "input": 0.255, + "output": 1, + "cache_read": 0.03 }, "type": "chat" - } - ] - }, - "xiaomi-token-plan-cn": { - "id": "xiaomi-token-plan-cn", - "name": "Xiaomi 
Token Plan (China)", - "display_name": "Xiaomi Token Plan (China)", - "api": "https://token-plan-cn.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ + }, { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", + "id": "minimax/minimax-m1", + "name": "MiniMax: MiniMax M1", + "display_name": "MiniMax: MiniMax M1", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 1000000, + "output": 40000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2.2 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "minimax/minimax-m2.5", + "name": "MiniMax: MiniMax M2.5", + "display_name": "MiniMax: MiniMax M2.5", "modalities": { "input": [ "text" @@ -47096,8 +47993,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -47107,98 +48004,65 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-02-12", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 0.25, + "output": 1.2, + "cache_read": 0.029 }, "type": "chat" }, { - "id": 
"mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "minimax/minimax-m2-her", + "name": "MiniMax: MiniMax M2-her", + "display_name": "MiniMax: MiniMax M2-her", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 65536, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-23", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "minimax/minimax-m2.7", + "name": "MiniMax: MiniMax M2.7", + "display_name": "MiniMax: MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 204800, "output": 131072 }, "temperature": true, @@ -47218,79 +48082,57 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - 
"display_name": "MiMo-V2-Pro", + "id": "minimax/minimax-01", + "name": "MiniMax: MiniMax-01", + "display_name": "MiniMax: MiniMax-01", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1000192, + "output": 1000192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": true, + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "x-ai/grok-4.20", + "name": "xAI: Grok 4.20", + "display_name": "xAI: Grok 4.20", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -47298,8 +48140,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -47307,42 +48149,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-31", + "last_updated": "2026-04-11", 
"cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 2, + "output": 6, + "cache_read": 0.2 }, "type": "chat" - } - ] - }, - "wandb": { - "id": "wandb", - "name": "Weights & Biases", - "display_name": "Weights & Biases", - "api": "https://api.inference.wandb.ai/v1", - "doc": "https://docs.wandb.ai/guides/integrations/inference/", - "models": [ + }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "x-ai/grok-code-fast-1:optimized:free", + "name": "xAI: Grok Code Fast 1 Optimized (experimental, free)", + "display_name": "xAI: Grok Code Fast 1 Optimized (experimental, free)", "modalities": { "input": [ "text" @@ -47352,30 +48173,33 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-08-27", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "x-ai/grok-4.20-multi-agent", + "name": "xAI: Grok 4.20 Multi-Agent", + "display_name": "xAI: Grok 4.20 Multi-Agent", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -47383,40 +48207,43 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2026-03-12", + 
"attachment": true, + "open_weights": false, + "release_date": "2026-03-31", + "last_updated": "2026-04-11", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2, + "output": 6, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "x-ai/grok-4.3", + "name": "xAI: Grok 4.3", + "display_name": "xAI: Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -47426,30 +48253,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen3-Coder-480B-A35B-Instruct", + "id": "kwaipilot/kat-coder-pro-v2", + "name": "Kwaipilot: KAT-Coder-Pro V2", + "display_name": "Kwaipilot: KAT-Coder-Pro V2", "modalities": { "input": [ "text" @@ -47459,8 +48280,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 80000 }, "temperature": true, "tool_call": true, @@ -47469,19 +48290,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2026-03-12", + "release_date": "2026-03-27", + "last_updated": "2026-04-11", "cost": { - "input": 1, - "output": 
1.5 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "zai-org/GLM-5-FP8", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "nousresearch/hermes-4-405b", + "name": "Nous: Hermes 4 405B", + "display_name": "Nous: Hermes 4 405B", "modalities": { "input": [ "text" @@ -47491,62 +48312,60 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-03-12", + "release_date": "2025-08-25", + "last_updated": "2025-08-25", "cost": { "input": 1, - "output": 3.2 + "output": 3 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "nousresearch/hermes-3-llama-3.1-405b", + "name": "Nous: Hermes 3 405B Instruct", + "display_name": "Nous: Hermes 3 405B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2026-03-12", + "release_date": "2024-08-16", + "last_updated": "2024-08-16", "cost": { - "input": 0.17, - "output": 0.66 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "nousresearch/hermes-4-70b", + "name": "Nous: Hermes 4 70B", + "display_name": "Nous: Hermes 4 70B", "modalities": { "input": [ "text" @@ -47556,30 
+48375,30 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2026-03-12", + "release_date": "2025-08-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.13, + "output": 0.4, + "cache_read": 0.055 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "nousresearch/hermes-3-llama-3.1-70b", + "name": "Nous: Hermes 3 70B Instruct", + "display_name": "Nous: Hermes 3 70B Instruct", "modalities": { "input": [ "text" @@ -47589,30 +48408,28 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2026-03-12", + "release_date": "2024-08-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.22, - "output": 0.22 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama 3.1 70B", - "display_name": "Llama 3.1 70B", + "id": "nousresearch/hermes-2-pro-llama-3-8b", + "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", + "display_name": "NousResearch: Hermes 2 Pro - Llama-3 8B", "modalities": { "input": [ "text" @@ -47622,28 +48439,28 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": 
"2024-07-23", - "last_updated": "2026-03-12", + "release_date": "2024-05-27", + "last_updated": "2024-06-27", "cost": { - "input": 0.8, - "output": 0.8 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "OpenPipe/Qwen3-14B-Instruct", - "name": "OpenPipe Qwen3 14B Instruct", - "display_name": "OpenPipe Qwen3 14B Instruct", + "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", + "name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "display_name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", "modalities": { "input": [ "text" @@ -47653,28 +48470,29 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { - "input": 0.05, - "output": 0.22 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "microsoft/Phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "nvidia/nemotron-3-super-120b-a12b:free", + "name": "NVIDIA: Nemotron 3 Super (free)", + "display_name": "NVIDIA: Nemotron 3 Super (free)", "modalities": { "input": [ "text" @@ -47684,8 +48502,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -47695,19 +48513,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2026-03-12", + "release_date": "2026-03-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.08, - "output": 0.35 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-FP8", - "name": "NVIDIA Nemotron 3 Super 120B", - "display_name": "NVIDIA Nemotron 3 
Super 120B", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "NVIDIA: Nemotron 3 Super", + "display_name": "NVIDIA: Nemotron 3 Super", "modalities": { "input": [ "text" @@ -47723,22 +48540,24 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, "release_date": "2026-03-11", - "last_updated": "2026-03-12", + "last_updated": "2026-04-11", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.1, + "output": 0.5, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "nvidia/nemotron-nano-9b-v2", + "name": "NVIDIA: Nemotron Nano 9B V2", + "display_name": "NVIDIA: Nemotron Nano 9B V2", "modalities": { "input": [ "text" @@ -47748,64 +48567,64 @@ ] }, "limit": { - "context": 161000, - "output": 161000 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2026-03-12", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 0.55, - "output": 1.65 + "input": 0.04, + "output": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", + "name": "NVIDIA: Nemotron 3 Nano Omni (free)", + "display_name": "NVIDIA: Nemotron 3 Nano Omni (free)", "modalities": { "input": [ - "text" + "text", + "audio", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - 
"attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-12", + "release_date": "2026-04-28", + "last_updated": "2026-05-01", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B", "modalities": { "input": [ "text" @@ -47815,79 +48634,92 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-12", + "open_weights": true, + "release_date": "2024-12", + "last_updated": "2026-02-04", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "anthropic/claude-sonnet-4.6", + "name": "Anthropic: Claude Sonnet 4.6", + "display_name": "Anthropic: Claude Sonnet 4.6", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ 
"thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-12", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.5, - "output": 2.85 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "anthropic/claude-opus-4.6-fast", + "name": "Anthropic: Claude Opus 4.6 (Fast)", + "display_name": "Anthropic: Claude Opus 4.6 (Fast)", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -47895,36 +48727,62 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true - } + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-04-07", + "last_updated": "2026-04-11", "cost": { - "input": 0.3, - "output": 1.2 + "input": 30, + "output": 150, + "cache_read": 3, + "cache_write": 37.5 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "anthropic/claude-3-haiku", + "name": "Anthropic: Claude 3 Haiku", + "display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -47932,52 +48790,33 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" - } - ] - }, - "chutes": { - "id": "chutes", - "name": "Chutes", - "display_name": "Chutes", - "api": "https://llm.chutes.ai/v1", - "doc": "https://llm.chutes.ai/v1/models", - "models": [ + }, { - "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", - "name": "DeepHermes 3 Mistral 24B Preview", - "display_name": "DeepHermes 3 Mistral 24B Preview", + "id": "anthropic/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ + "image", + "pdf", "text" ], 
"output": [ @@ -47985,31 +48824,35 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2026-03-15", "cost": { - "input": 0.0245, - "output": 0.0978, - "cache_read": 0.01225 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "NousResearch/Hermes-4-14B", - "name": "Hermes 4 14B", - "display_name": "Hermes 4 14B", + "id": "anthropic/claude-opus-4.7-fast", + "name": "Anthropic: Claude Opus 4.7 (Fast)", + "display_name": "Anthropic: Claude Opus 4.7 (Fast)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -48017,87 +48860,121 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-12", + "last_updated": "2026-05-16", "cost": { - "input": 0.0136, - "output": 0.0543, - "cache_read": 0.0068 + "input": 30, + "output": 150, + "cache_read": 3, + "cache_write": 37.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "anthropic/claude-opus-4.6", + "name": "Anthropic: Claude Opus 4.6", + "display_name": "Anthropic: Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.06, - "output": 0.22, - "cache_read": 0.03 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B-TEE", - "name": "Qwen3 32B TEE", - "display_name": "Qwen3 32B TEE", + "id": "anthropic/claude-opus-4.1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -48105,8 +48982,8 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -48114,33 +48991,35 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.04 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-27B-TEE", - "name": "Qwen3.6 27B TEE", - "display_name": "Qwen3.6 27B TEE", + "id": "anthropic/claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -48148,34 +49027,25 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - 
"thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.195, - "output": 1.56, - "cache_read": 0.0975 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "anthropic/claude-haiku-4.5", + "name": "Anthropic: Claude Haiku 4.5", + "display_name": "Anthropic: Claude Haiku 4.5", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -48183,31 +49053,35 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3Guard-Gen-0.6B", - "name": "Qwen3Guard Gen 0.6B", - "display_name": "Qwen3Guard Gen 0.6B", + "id": "anthropic/claude-opus-4.5", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -48215,31 +49089,35 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": 
"2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "anthropic/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -48247,93 +49125,125 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0.8, - "cache_read": 0.05 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", - "name": "Qwen3 235B A22B Instruct 2507 TEE", - "display_name": "Qwen3 235B A22B Instruct 2507 TEE", + "id": "anthropic/claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2024-10-22", + 
"last_updated": "2024-10-22", "cost": { - "input": 0.1, - "output": 0.6, - "cache_read": 0.05 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next-TEE", - "name": "Qwen3 Coder Next TEE", - "display_name": "Qwen3 Coder Next TEE", + "id": "anthropic/claude-opus-4.7", + "name": "Anthropic: Claude Opus 4.7", + "display_name": "Anthropic: Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-16", + "last_updated": "2026-05-01", "cost": { - "input": 0.12, - "output": 0.75, - "cache_read": 0.06 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "inclusionai/ring-2.6-1t", + "name": "inclusionAI: Ring-2.6-1T", + "display_name": "inclusionAI: Ring-2.6-1T", "modalities": { "input": [ "text" @@ -48344,7 +49254,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -48352,69 +49262,56 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2026-05-08", + "last_updated": "2026-05-16", "cost": { - "input": 0.11, - "output": 0.6, - "cache_read": 0.055 + "input": 0.075, + "output": 0.625, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "inclusionai/ling-2.6-1t", + "name": "inclusionAI: Ling-2.6-1T", + "display_name": "inclusionAI: Ling-2.6-1T", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": false, + "open_weights": false, + 
"release_date": "2026-04-23", + "last_updated": "2026-05-16", "cost": { - "input": 0.0543, - "output": 0.2174, - "cache_read": 0.02715 + "input": 0.3, + "output": 2.5, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B-TEE", - "name": "Qwen3.5 397B A17B TEE", - "display_name": "Qwen3.5 397B A17B TEE", + "id": "inclusionai/ling-2.6-flash", + "name": "inclusionAI: Ling-2.6 Flash", + "display_name": "inclusionAI: Ling-2.6 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -48422,72 +49319,60 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-18", - "last_updated": "2026-04-25", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 0.39, - "output": 2.34, - "cache_read": 0.195 + "input": 0.08, + "output": 0.24, + "cache_read": 0.016 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "mistralai/mistral-large-2512", + "name": "Mistral: Mistral Large 3 2512", + "display_name": "Mistral: Mistral Large 3 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2024-11-01", + "last_updated": "2025-12-16", 
"cost": { - "input": 0.2989, - "output": 1.1957, - "cache_read": 0.14945 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1-TEE", - "name": "GLM 5.1 TEE", - "display_name": "GLM 5.1 TEE", + "id": "mistralai/mistral-7b-instruct-v0.1", + "name": "Mistral: Mistral 7B Instruct v0.1", + "display_name": "Mistral: Mistral 7B Instruct v0.1", "modalities": { "input": [ "text" @@ -48497,41 +49382,28 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 2824, + "output": 565 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", "cost": { - "input": 1.05, - "output": 3.5, - "cache_read": 0.525 + "input": 0.11, + "output": 0.19 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-FP8", - "name": "GLM 4.7 FP8", - "display_name": "GLM 4.7 FP8", + "id": "mistralai/mistral-large-2411", + "name": "Mistral Large 2411", + "display_name": "Mistral Large 2411", "modalities": { "input": [ "text" @@ -48541,30 +49413,28 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-04-25", + "release_date": "2024-07-24", + "last_updated": "2024-11-04", "cost": { - "input": 0.2989, - "output": 1.1957, - "cache_read": 0.14945 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "zai-org/GLM-5-TEE", - "name": "GLM 5 TEE", - 
"display_name": "GLM 5 TEE", + "id": "mistralai/mistral-saba", + "name": "Mistral: Saba", + "display_name": "Mistral: Saba", "modalities": { "input": [ "text" @@ -48574,41 +49444,28 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-14", - "last_updated": "2026-04-25", + "release_date": "2025-02-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.95, - "output": 2.55, - "cache_read": 0.475 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-TEE", - "name": "GLM 4.7 TEE", - "display_name": "GLM 4.7 TEE", + "id": "mistralai/codestral-2508", + "name": "Mistral: Codestral 2508", + "display_name": "Mistral: Codestral 2508", "modalities": { "input": [ "text" @@ -48618,45 +49475,32 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 256000, + "output": 51200 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.39, - "output": 1.75, - "cache_read": 0.195 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "GLM 4.6V", - "display_name": "GLM 4.6V", + "id": "mistralai/mistral-small-3.2-24b-instruct", + "name": "Mistral: 
Mistral Small 3.2 24B", + "display_name": "Mistral: Mistral Small 3.2 24B", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" @@ -48664,42 +49508,31 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.15 + "input": 0.06, + "output": 0.18, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "zai-org/GLM-5-Turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "mistralai/mistral-small-2603", + "name": "Mistral: Mistral Small 4", + "display_name": "Mistral: Mistral Small 4", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -48707,8 +49540,8 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -48716,32 +49549,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-04-25", + "release_date": "2026-03-16", + "last_updated": "2026-04-11", "cost": { - "input": 0.4891, - "output": 1.9565, - "cache_read": 0.24455 + "input": 0.15, + "output": 0.6, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "XiaomiMiMo/MiMo-V2-Flash-TEE", - "name": "MiMo V2 Flash TEE", - 
"display_name": "MiMo V2 Flash TEE", + "id": "mistralai/mistral-nemo", + "name": "Mistral: Mistral Nemo", + "display_name": "Mistral: Mistral Nemo", "modalities": { "input": [ "text" @@ -48751,8 +49573,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -48761,19 +49583,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "release_date": "2024-07-01", + "last_updated": "2024-07-30", "cost": { - "input": 0.09, - "output": 0.29, - "cache_read": 0.045 + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "mistralai/devstral-2512", + "name": "Mistral: Devstral 2 2512", + "display_name": "Mistral: Devstral 2 2512", "modalities": { "input": [ "text" @@ -48783,43 +49604,32 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-09-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 + "input": 0.4, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-TEE", - "name": "DeepSeek V3.1 TEE", - "display_name": "DeepSeek V3.1 TEE", + "id": "mistralai/mistral-medium-3-5", + "name": "Mistral: Mistral Medium 3.5", + "display_name": "Mistral: Mistral Medium 3.5", "modalities": { "input": [ + "image", 
"text" ], "output": [ @@ -48827,8 +49637,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -48836,64 +49646,52 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-30", + "last_updated": "2026-05-07", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-0324-TEE", - "name": "DeepSeek V3 0324 TEE", - "display_name": "DeepSeek V3 0324 TEE", + "id": "mistralai/ministral-14b-2512", + "name": "Mistral: Ministral 3 14B 2512", + "display_name": "Mistral: Ministral 3 14B 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.25, - "output": 1, - "cache_read": 0.125 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528-TEE", - "name": "DeepSeek R1 0528 TEE", - "display_name": "DeepSeek R1 0528 TEE", + "id": "mistralai/mixtral-8x22b-instruct", + "name": "Mistral: Mixtral 8x22B Instruct", + "display_name": "Mistral: Mixtral 8x22B Instruct", "modalities": { "input": [ "text" @@ -48903,85 +49701,60 @@ ] }, "limit": { - "context": 163840, - "output": 
65536 + "context": 65536, + "output": 13108 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0.45, - "output": 2.15, - "cache_read": 0.225 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-TEE", - "name": "DeepSeek V3.2 TEE", - "display_name": "DeepSeek V3.2 TEE", + "id": "mistralai/voxtral-small-24b-2507", + "name": "Mistral: Voxtral Small 24B 2507", + "display_name": "Mistral: Voxtral Small 24B 2507", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 32000, + "output": 6400 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.14 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b-TEE", - "name": "gpt oss 120b TEE", - "display_name": "gpt oss 120b TEE", + "id": "mistralai/devstral-medium", + "name": "Mistral: Devstral Medium", + "display_name": "Mistral: Devstral Medium", "modalities": { "input": [ "text" @@ -48992,44 +49765,31 @@ }, "limit": { "context": 131072, - "output": 
65536 + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.09, - "output": 0.36, - "cache_read": 0.045 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "unsloth/gemma-3-12b-it", - "name": "gemma 3 12b it", - "display_name": "gemma 3 12b it", + "id": "mistralai/pixtral-large-2411", + "name": "Mistral: Pixtral Large 2411", + "display_name": "Mistral: Pixtral Large 2411", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" @@ -49037,28 +49797,27 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2024-11-19", + "last_updated": "2026-03-15", "cost": { - "input": 0.03, - "output": 0.1, - "cache_read": 0.015 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "unsloth/Llama-3.2-3B-Instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "mistralai/mistral-large-2407", + "name": "Mistral Large 2407", + "display_name": "Mistral Large 2407", "modalities": { "input": [ "text" @@ -49068,29 +49827,91 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-02-12", - 
"last_updated": "2026-04-25", + "release_date": "2024-11-19", + "last_updated": "2026-03-15", "cost": { - "input": 0.01, - "output": 0.0136, - "cache_read": 0.005 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "unsloth/gemma-3-4b-it", - "name": "gemma 3 4b it", - "display_name": "gemma 3 4b it", + "id": "mistralai/mistral-large", + "name": "Mistral Large", + "display_name": "Mistral Large", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 25600 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-24", + "last_updated": "2025-12-02", + "cost": { + "input": 2, + "output": 6 + }, + "type": "chat" + }, + { + "id": "mistralai/ministral-3b-2512", + "name": "Mistral: Ministral 3 3B 2512", + "display_name": "Mistral: Ministral 3 3B 2512", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2026-03-15", + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "chat" + }, + { + "id": "mistralai/mistral-medium-3", + "name": "Mistral: Mistral Medium 3", + "display_name": "Mistral: Mistral Medium 3", "modalities": { "input": [ "text", @@ -49101,29 +49922,28 @@ ] }, "limit": { - "context": 96000, - "output": 96000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.01, - "output": 0.0272, - "cache_read": 
0.005 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "unsloth/Llama-3.2-1B-Instruct", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "mistralai/mistral-small-24b-instruct-2501", + "name": "Mistral: Mistral Small 3", + "display_name": "Mistral: Mistral Small 3", "modalities": { "input": [ "text" @@ -49133,29 +49953,28 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 32768, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-04-25", + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 + "input": 0.05, + "output": 0.08 }, "type": "chat" }, { - "id": "unsloth/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "mistralai/devstral-small", + "name": "Mistral: Devstral Small 1.1", + "display_name": "Mistral: Devstral Small 1.1", "modalities": { "input": [ "text" @@ -49166,40 +49985,39 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 26215 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-05-07", + "last_updated": "2025-07-10", "cost": { - "input": 0.02, - "output": 0.04, - "cache_read": 0.01 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "unsloth/gemma-3-27b-it", - "name": "gemma 3 27b it", - "display_name": "gemma 3 27b it", + "id": "mistralai/ministral-8b-2512", + "name": "Mistral: Ministral 3 8B 2512", + "display_name": "Mistral: Ministral 3 8B 2512", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 
128000, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49208,19 +50026,18 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-12-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "google/gemma-4-31B-turbo-TEE", - "name": "gemma 4 31B turbo TEE", - "display_name": "gemma 4 31B turbo TEE", + "id": "mistralai/mistral-medium-3.1", + "name": "Mistral: Mistral Medium 3.1", + "display_name": "Mistral: Mistral Medium 3.1", "modalities": { "input": [ "text", @@ -49232,89 +50049,72 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.13, - "output": 0.38, - "cache_read": 0.065 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6-TEE", - "name": "Kimi K2.6 TEE", - "display_name": "Kimi K2.6 TEE", + "id": "mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral: Mistral Small 3.1 24B", + "display_name": "Mistral: Mistral Small 3.1 24B", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 128000, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + 
"supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-04-20", - "last_updated": "2026-04-25", + "release_date": "2025-03-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.475 + "input": 0.35, + "output": 0.56, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5-TEE", - "name": "Kimi K2.5 TEE", - "display_name": "Kimi K2.5 TEE", + "id": "qwen/qwen3-vl-8b-thinking", + "name": "Qwen: Qwen3 VL 8B Thinking", + "display_name": "Qwen: Qwen3 VL 8B Thinking", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49334,21 +50134,19 @@ } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.44, - "output": 2, - "cache_read": 0.22 + "input": 0.117, + "output": 1.365 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5-TEE", - "name": "MiniMax M2.5 TEE", - "display_name": "MiniMax M2.5 TEE", + "id": "qwen/qwen3-30b-a3b-instruct-2507", + "name": "Qwen: Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -49358,7 +50156,41 @@ ] }, "limit": { - "context": 196608, + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2026-03-15", + "cost": { + "input": 0.09, + "output": 0.3, + "cache_read": 0.04 + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-plus-20260420", + "name": "Qwen: Qwen3.5 Plus 2026-04-20", + "display_name": "Qwen: Qwen3.5 Plus 
2026-04-20", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, "output": 65536 }, "temperature": true, @@ -49378,21 +50210,20 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.15, - "output": 1.2, - "cache_read": 0.075 + "input": 0.4, + "output": 2.4 }, "type": "chat" }, { - "id": "rednote-hilab/dots.ocr", - "name": "dots.ocr", - "display_name": "dots.ocr", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen: Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ "text", @@ -49403,40 +50234,42 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 52429 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-09-23", + "last_updated": "2026-01-10", "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 + "input": 0.2, + "output": 0.88, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "tngtech/DeepSeek-TNG-R1T2-Chimera-TEE", - "name": "DeepSeek TNG R1T2 Chimera TEE", - "display_name": "DeepSeek TNG R1T2 Chimera TEE", + "id": "qwen/qwen3.6-27b", + "name": "Qwen: Qwen3.6 27B", + "display_name": "Qwen: Qwen3.6 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -49444,32 +50277,34 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-25", - 
"last_updated": "2026-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.3, - "output": 1.1, - "cache_read": 0.15 + "input": 0.325, + "output": 3.25 }, "type": "chat" - } - ] - }, - "dinference": { - "id": "dinference", - "name": "DInference", - "display_name": "DInference", - "api": "https://api.dinference.com/v1", - "doc": "https://dinference.com", - "models": [ + }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen: Qwen2.5 VL 72B Instruct", + "display_name": "Qwen: Qwen2.5 VL 72B Instruct", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -49477,44 +50312,42 @@ ] }, "limit": { - "context": 131072, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08", - "last_updated": "2025-08", + "release_date": "2025-02-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.0675, - "output": 0.27 + "input": 0.8, + "output": 0.8, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen/qwen3.5-plus-02-15", + "name": "Qwen: Qwen3.5 Plus 2026-02-15", + "display_name": "Qwen: Qwen3.5 Plus 2026-02-15", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -49533,23 +50366,23 @@ ] } }, 
- "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.45, - "output": 1.65 + "input": 0.26, + "output": 1.56 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen: Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -49557,8 +50390,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49577,20 +50410,20 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-09-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.75, - "output": 2.4 + "input": 0.26, + "output": 2.6 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "qwen/qwen3-8b", + "name": "Qwen: Qwen3 8B", + "display_name": "Qwen: Qwen3 8B", "modalities": { "input": [ "text" @@ -49600,8 +50433,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 40960, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -49621,19 +50454,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 3.89 + "input": 0.05, + "output": 0.4, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B 
Instruct", "modalities": { "input": [ "text" @@ -49643,114 +50477,84 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2024-09", + "last_updated": "2026-01-10", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0.12, + "output": 0.39 }, "type": "chat" - } - ] - }, - "vivgrid": { - "id": "vivgrid", - "name": "Vivgrid", - "display_name": "Vivgrid", - "api": "https://api.vivgrid.com/v1", - "doc": "https://docs.vivgrid.com/models", - "models": [ + }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen: Qwen3.5-122B-A10B", + "display_name": "Qwen: Qwen3.5-122B-A10B", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": true, + "open_weights": true, + "release_date": 
"2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.26, + "output": 2.08 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "qwen/qwen-plus-2025-07-28:thinking", + "name": "Qwen: Qwen Plus 0728 (thinking)", + "display_name": "Qwen: Qwen Plus 0728 (thinking)", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49758,43 +50562,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.26, + "output": 0.78 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "qwen/qwen3-max-thinking", + "name": "Qwen: Qwen3 Max Thinking", + "display_name": "Qwen: Qwen3 Max Thinking", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49805,383 +50597,269 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - 
"thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2026-01-23", + "last_updated": "2026-03-15", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.78, + "output": 3.9 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "qwen/qwen3-max", + "name": "Qwen: Qwen3 Max", + "display_name": "Qwen: Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-09-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 1.2, + "output": 6, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "qwen/qwen3-235b-a22b-2507", + "name": "Qwen: Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", "modalities": { "input": 
[ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 52429 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-01", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.071, + "output": 0.1 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "qwen/qwen3-235b-a22b", + "name": "Qwen: Qwen3 235B A22B", + "display_name": "Qwen: Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - 
"last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.455, + "output": 1.82, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen: Qwen3.5 397B A17B", + "display_name": "Qwen: Qwen3.5 397B A17B", "modalities": { "input": [ - "text", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-02-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.39, + "output": 2.34 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "qwen/qwen-2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - 
"tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "open_weights": true, + "release_date": "2024-11-11", + "last_updated": "2026-03-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.2, + "output": 0.2, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "qwen/qwen3.5-9b", + "name": "Qwen: Qwen3.5-9B", + "display_name": "Qwen: Qwen3.5-9B", "modalities": { "input": [ - "text", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "release_date": "2026-03-10", + "last_updated": "2026-03-15", "cost": { 
- "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.05, + "output": 0.15 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "qwen/qwen3-coder-next", + "name": "Qwen: Qwen3 Coder Next", + "display_name": "Qwen: Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -50191,106 +50869,75 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-02-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 0.42 + "input": 0.12, + "output": 0.75, + "cache_read": 0.035 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "qwen/qwen3-coder", + "name": "Qwen: Qwen3 Coder 480B A35B", + "display_name": "Qwen: Qwen3 Coder 480B A35B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 52429 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + 
"release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.22, + "output": 1, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "qwen/qwen3.6-plus", + "name": "Qwen: Qwen3.6 Plus", + "display_name": "Qwen: Qwen3.6 Plus", "modalities": { "input": [ - "text", "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -50299,45 +50946,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2025-08-26", + "last_updated": "2026-04-11", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.325, + "output": 1.95, + "cache_read": 0.0325, + "cache_write": 0.40625 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "qwen/qwen3-coder-flash", + "name": "Qwen: Qwen3 Coder Flash", + "display_name": "Qwen: Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -50348,62 +50980,39 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, 
- "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2026-03-15", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.195, + "output": 0.975, + "cache_read": 0.06 }, "type": "chat" - } - ] - }, - "deepinfra": { - "id": "deepinfra", - "name": "Deep Infra", - "display_name": "Deep Infra", - "doc": "https://deepinfra.com/models", - "models": [ + }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen 3.5 397B A17B", - "display_name": "Qwen 3.5 397B A17B", + "id": "qwen/qwen3-30b-a3b-thinking-2507", + "name": "Qwen: Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 32768, + "output": 6554 }, "temperature": true, "tool_call": true, @@ -50422,34 +51031,31 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-01", - "last_updated": "2026-04-20", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.54, - "output": 3.4 + "input": 0.051, + "output": 0.34 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-35B-A3B", - "name": "Qwen 3.5 35B A3B", - "display_name": "Qwen 3.5 35B A3B", + "id": "qwen/qwen3-32b", + "name": "Qwen: Qwen3 32B", + "display_name": "Qwen: Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ 
-50468,53 +51074,21 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-01", - "last_updated": "2026-04-20", - "cost": { - "input": 0.2, - "output": 0.95 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", - "name": "Qwen3 Coder 480B A35B Instruct Turbo", - "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 66536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2024-12-01", + "last_updated": "2026-02-04", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.08, + "output": 0.24, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen: Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -50524,33 +51098,44 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-09-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.0975, + "output": 0.78 }, "type": "chat" }, { - "id": 
"Qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "qwen/qwen3.5-flash-02-23", + "name": "Qwen: Qwen3.5-Flash", + "display_name": "Qwen: Qwen3.5-Flash", "modalities": { "input": [ - "text", "image", + "text", "video" ], "output": [ @@ -50558,8 +51143,8 @@ ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50580,18 +51165,18 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-Flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "qwen/qwen3-30b-a3b", + "name": "Qwen: Qwen3 30B A3B", + "display_name": "Qwen: Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -50601,8 +51186,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -50623,21 +51208,22 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.06, - "output": 0.4 + "input": 0.08, + "output": 0.28, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "Qwen: Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -50646,39 +51232,52 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.13, + "output": 1.56 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen: Qwen3.5-35B-A3B", + "display_name": "Qwen: Qwen3.5-35B-A3B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50697,36 +51296,36 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.43, - "output": 1.75, - "cache_read": 0.08 + "input": 0.1625, + "output": 1.3 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "qwen/qwen3.6-35b-a3b", + "name": "Qwen: Qwen3.6 35B A3B", + "display_name": "Qwen: Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -50742,22 +51341,21 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "attachment": true, + "open_weights": false, + "release_date": 
"2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.1612, + "output": 0.96525, + "cache_read": 0.1612 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen/qwen-plus-2025-07-28", + "name": "Qwen: Qwen Plus 0728", + "display_name": "Qwen: Qwen Plus 0728", "modalities": { "input": [ "text" @@ -50767,14 +51365,13 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -50789,32 +51386,61 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-09-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.8, - "output": 2.56, - "cache_read": 0.16 + "input": 0.26, + "output": 0.78 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "Qwen: Qwen3 VL 8B Instruct", + "display_name": "Qwen: Qwen3 VL 8B Instruct", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "cost": { + "input": 0.08, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen: Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 }, 
"temperature": true, "tool_call": true, @@ -50833,21 +51459,20 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-07-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.11, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "qwen/qwen3.6-max-preview", + "name": "Qwen: Qwen3.6 Max Preview", + "display_name": "Qwen: Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -50857,8 +51482,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50878,52 +51503,51 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.43, - "output": 1.74, - "cache_read": 0.08 + "input": 1.04, + "output": 6.24, + "cache_write": 1.3 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama 4 Scout 17B", - "display_name": "Llama 4 Scout 17B", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 10000000, - "output": 16384 + "context": 160000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0.07, + "output": 0.27 }, "type": "chat" }, { - "id": 
"meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen: Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -50934,89 +51558,122 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 52429 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-09-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.02, - "output": 0.05 + "input": 0.09, + "output": 1.1 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama 3.1 70B", - "display_name": "Llama 3.1 70B", + "id": "qwen/qwen3.5-27b", + "name": "Qwen: Qwen3.5-27B", + "display_name": "Qwen: Qwen3.5-27B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.195, + "output": 1.56 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct-Turbo", - "name": "Llama 3.1 8B Turbo", - "display_name": "Llama 3.1 8B Turbo", + "id": "qwen/qwen3.6-flash", + "name": "Qwen: Qwen3.6 Flash", + "display_name": "Qwen: Qwen3.6 Flash", "modalities": { "input": [ - "text" + "text", + 
"image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.02, - "output": 0.03 + "input": 0.25, + "output": 1.5, + "cache_write": 0.3125 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", - "name": "Llama 3.3 70B Turbo", - "display_name": "Llama 3.3 70B Turbo", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "Qwen: Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -51024,30 +51681,30 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.32 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B FP8", - "display_name": "Llama 4 Maverick 17B FP8", + "id": "qwen/qwen-plus", + "name": "Qwen: Qwen-Plus", + "display_name": "Qwen: Qwen-Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -51055,26 +51712,39 @@ }, "limit": { "context": 1000000, - "output": 
16384 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.4, + "output": 1.2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-70B-Instruct-Turbo", - "name": "Llama 3.1 70B Turbo", - "display_name": "Llama 3.1 70B Turbo", + "id": "qwen/qwen3-coder-plus", + "name": "Qwen: Qwen3 Coder Plus", + "display_name": "Qwen: Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -51084,27 +51754,29 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-07-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.65, + "output": 3.25, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "qwen/qwen-2.5-7b-instruct", + "name": "Qwen: Qwen2.5 7B Instruct", + "display_name": "Qwen: Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -51114,42 +51786,28 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 32768, + "output": 6554 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - 
"summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "release_date": "2024-09", + "last_updated": "2025-04-16", "cost": { - "input": 0.5, - "output": 2.15, - "cache_read": 0.35 + "input": 0.04, + "output": 0.1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "qwen/qwen3-14b", + "name": "Qwen: Qwen3 14B", + "display_name": "Qwen: Qwen3 14B", "modalities": { "input": [ "text" @@ -51159,8 +51817,8 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -51180,24 +51838,24 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.26, - "output": 0.38, - "cache_read": 0.13 + "input": 0.06, + "output": 0.24, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen/qwen3-vl-32b-instruct", + "name": "Qwen: Qwen3 VL 32B Instruct", + "display_name": "Qwen: Qwen3 VL 32B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -51205,33 +51863,27 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + 
"release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.03, - "output": 0.14 + "input": 0.104, + "output": 0.416 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "tencent/hy3-preview", + "name": "Tencent: Hy3 Preview", + "display_name": "Tencent: Hy3 Preview", "modalities": { "input": [ "text" @@ -51241,8 +51893,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -51250,25 +51902,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2026-04-22", + "last_updated": "2026-05-16", "cost": { - "input": 0.05, - "output": 0.24 + "input": 0.066, + "output": 0.26, + "cache_read": 0.029 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "tencent/hunyuan-a13b-instruct", + "name": "Tencent: Hunyuan A13B Instruct", + "display_name": "Tencent: Hunyuan A13B Instruct", "modalities": { "input": [ "text" @@ -51279,56 +51927,44 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-11-06", - "last_updated": "2025-11-07", + "open_weights": false, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.47, - "output": 2 + "input": 0.14, + "output": 0.57 
}, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "google/gemini-3-pro-image-preview", + "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", + "display_name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 65536, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -51336,99 +51972,119 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2025-11-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.75, - "output": 3.5, - "cache_read": 0.15 + "input": 2, + "output": 12, + "reasoning": 12 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "google/gemma-4-26b-a4b-it", + "name": "Google: Gemma 4 26B A4B", + "display_name": "Google: Gemma 4 26B A4B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + 
"release_date": "2026-04-03", + "last_updated": "2026-04-11", "cost": { - "input": 0.5, - "output": 2 + "input": 0.12, + "output": 0.4 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "google/gemini-3.1-flash-lite", + "name": "Google: Gemini 3.1 Flash Lite", + "display_name": "Google: Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-07", + "last_updated": "2026-05-16", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.15 + "input": 0.25, + "output": 1.5, + "reasoning": 1.5, + "cache_read": 0.025, + "cache_write": 0.08333 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "google/gemini-2.5-pro", + "name": "Google: Gemini 2.5 Pro", + "display_name": "Google: Gemini 2.5 Pro", "modalities": { "input": [ - "text", + "audio", "image", + "pdf", + "text", "video" ], "output": [ @@ -51436,8 +52092,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -51448,31 +52104,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", 
"continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "release_date": "2025-03-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.5, - "output": 2.8 + "input": 1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "google/gemma-3-27b-it", + "name": "Google: Gemma 3 27B", + "display_name": "Google: Gemma 3 27B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -51480,51 +52147,41 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-03-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.254, - "output": 1.02 + "input": 0.03, + "output": 0.11, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "google/gemma-4-31b-it", + "name": "Google: Gemma 4 31B", + "display_name": "Google: Gemma 4 31B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, + "context": 262144, "output": 131072 }, "temperature": true, @@ -51533,178 +52190,162 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": 
true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-04-02", + "last_updated": "2026-04-11", "cost": { - "input": 0.27, - "output": 0.95, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.14, + "output": 0.4 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "google/gemini-3.1-flash-image-preview", + "name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", + "display_name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 65536, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 1.2 + "input": 0.5, + "output": 3 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "anthropic/claude-3-7-sonnet-latest", - "name": "Claude Sonnet 3.7 (Latest)", - "display_name": "Claude Sonnet 3.7 (Latest)", + "id": "google/gemini-2.5-pro-preview", + "name": "Google: Gemini 2.5 Pro Preview 06-05", + "display_name": "Google: Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ - "text", - "image" + "audio", + 
"image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2025-06-05", + "last_updated": "2026-03-15", "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33 + "input": 1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-4-opus", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "google/gemma-3n-e4b-it", + "name": "Google: Gemma 3n 4B", + "display_name": "Google: Gemma 3n 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 6554 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-06-12", - "last_updated": "2025-06-12", + "attachment": false, + "open_weights": true, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 16.5, - "output": 82.5 + "input": 0.02, + "output": 0.04 }, "type": "chat" 
}, { - "id": "deepseek-ai/DeepSeek-V4-Flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "google/gemini-2.5-pro-preview-05-06", + "name": "Google: Gemini 2.5 Pro Preview 05-06", + "display_name": "Google: Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -51715,192 +52356,248 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "google/gemini-2.5-flash-lite-preview-09-2025", + "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", + "display_name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 65536, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + 
"default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2026-03-15", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.1, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.01, + "cache_write": 0.083333 }, "type": "chat" }, { - "id": "google/gemma-4-26B-A4B-it", - "name": "Gemma 4 26B", - "display_name": "Gemma 4 26B", + "id": "google/gemini-2.5-flash-lite", + "name": "Google: Gemini 2.5 Flash Lite", + "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ + "audio", + "image", + "pdf", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.34 + "input": 0.1, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.01, + "cache_write": 0.083333 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 
4 31B", - "display_name": "Gemma 4 31B", + "id": "google/lyria-3-clip-preview", + "name": "Google: Lyria 3 Clip Preview", + "display_name": "Google: Lyria 3 Clip Preview", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-30", + "last_updated": "2026-04-11", "cost": { - "input": 0.13, - "output": 0.38 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "qiniu-ai": { - "id": "qiniu-ai", - "name": "Qiniu", - "display_name": "Qiniu", - "api": "https://api.qnaigc.com/v1", - "doc": "https://developer.qiniu.com/aitokenapi", - "models": [ + }, { - "id": "qwen3-235b-a22b", - "name": "Qwen 3 235B A22B", - "display_name": "Qwen 3 235B A22B", + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Google: Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Google: Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - 
"release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", + "cost": { + "input": 2, + "output": 12, + "reasoning": 12 + }, "type": "chat" }, { - "id": "doubao-seed-1.6-flash", - "name": "Doubao-Seed 1.6 Flash", - "display_name": "Doubao-Seed 1.6 Flash", + "id": "google/gemini-2.0-flash-lite-001", + "name": "Google: Gemini 2.0 Flash Lite", + "display_name": "Google: Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text", + "audio", "image", + "pdf", + "text", "video" ], "output": [ @@ -51908,56 +52605,71 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", + "release_date": "2024-12-11", + "last_updated": "2026-03-15", + "cost": { + "input": 0.075, + "output": 0.3 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235b A22B Instruct 2507", - "display_name": "Qwen3 235b A22B Instruct 2507", + "id": "google/gemini-2.0-flash-001", + "name": "Google: Gemini 2.0 Flash", + "display_name": "Google: Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "release_date": "2024-12-11", + "last_updated": "2026-03-15", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025, + "cache_write": 0.083333 + }, "type": "chat" }, { - "id": "doubao-seed-2.0-code", - "name": "Doubao Seed 2.0 Code", - "display_name": "Doubao Seed 2.0 
Code", + "id": "google/gemini-3.1-flash-lite-preview", + "name": "Google: Gemini 3.1 Flash Lite Preview", + "display_name": "Google: Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text", + "audio", "image", + "pdf", + "text", "video" ], "output": [ @@ -51965,8 +52677,8 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -51974,54 +52686,95 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2026-03-03", + "last_updated": "2026-03-15", + "cost": { + "input": 0.25, + "output": 1.5, + "reasoning": 1.5 + }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "google/gemini-3.1-pro-preview", + "name": "Google: Gemini 3.1 Pro Preview", + "display_name": "Google: Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-19", + "last_updated": "2026-03-15", + "cost": { + "input": 2, + "output": 12, + "reasoning": 12 + }, "type": "chat" }, { - "id": "doubao-1.5-thinking-pro", - "name": "Doubao 1.5 
Thinking Pro", - "display_name": "Doubao 1.5 Thinking Pro", + "id": "google/gemini-3-flash-preview", + "name": "Google: Gemini 3 Flash Preview", + "display_name": "Google: Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -52029,146 +52782,154 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-12-17", + "last_updated": "2026-03-15", + "cost": { + "input": 0.5, + "output": 3, + "reasoning": 3, + "cache_read": 0.05, + "cache_write": 0.083333 + }, "type": "chat" }, { - "id": "claude-3.7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "google/gemma-2-27b-it", + "name": "Google: Gemma 2 27B", + "display_name": "Google: Gemma 2 27B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" 
- ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-06-24", + "last_updated": "2024-06-24", + "cost": { + "input": 0.65, + "output": 0.65 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "google/lyria-3-pro-preview", + "name": "Google: Lyria 3 Pro Preview", + "display_name": "Google: Lyria 3 Pro Preview", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-22", - "last_updated": "2026-02-22", + "release_date": "2026-03-30", + "last_updated": "2026-04-11", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "qwen-vl-max-2025-01-25", - "name": "Qwen VL-MAX-2025-01-25", - "display_name": "Qwen VL-MAX-2025-01-25", + "id": "google/gemma-3-12b-it", + "name": "Google: Gemma 3 12B", + "display_name": "Google: Gemma 3 12B", "modalities": { "input": [ - "text", "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-03-13", + "last_updated": 
"2026-03-15", + "cost": { + "input": 0.04, + "output": 0.13, + "cache_read": 0.015 + }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "google/gemini-2.5-flash", + "name": "Google: Gemini 2.5 Flash", + "display_name": "Google: Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 4096 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -52179,277 +52940,261 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-07-17", + "last_updated": "2026-03-15", + "cost": { + "input": 0.3, + "output": 2.5, + "reasoning": 2.5, + "cache_read": 0.03, + "cache_write": 0.083333 + }, "type": "chat" }, { - "id": "doubao-1.5-pro-32k", - "name": "Doubao 1.5 Pro 32k", - "display_name": "Doubao 1.5 Pro 32k", + "id": "google/gemini-2.5-flash-image", + "name": "Google: Nano Banana (Gemini 2.5 Flash Image)", + "display_name": "Google: Nano Banana (Gemini 2.5 Flash Image)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 128000, - "output": 12000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" + "release_date": "2025-10-08", + "last_updated": 
"2026-03-15", + "cost": { + "input": 0.3, + "output": 2.5 + }, + "type": "imageGeneration" }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "Qwen 2.5 VL 72B Instruct", - "display_name": "Qwen 2.5 VL 72B Instruct", + "id": "google/gemma-3-4b-it", + "name": "Google: Gemma 3 4B", + "display_name": "Google: Gemma 3 4B", "modalities": { "input": [ - "text", "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 19200 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-03-13", + "last_updated": "2026-03-15", + "cost": { + "input": 0.04, + "output": 0.08 + }, "type": "chat" }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "microsoft/phi-4", + "name": "Microsoft: Phi 4", + "display_name": "Microsoft: Phi 4", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.06, + "output": 0.14 + }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b-thinking", - "name": "Qwen3-Vl 30b A3b Thinking", - "display_name": "Qwen3-Vl 30b A3b Thinking", + "id": "microsoft/wizardlm-2-8x22b", + "name": "WizardLM-2 8x22B", + "display_name": "WizardLM-2 8x22B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - 
"context": 128000, - "output": 32000 + "context": 65535, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-04-24", + "last_updated": "2024-04-24", + "cost": { + "input": 0.62, + "output": 0.62 }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-09", - "last_updated": "2026-02-09", "type": "chat" }, { - "id": "gemini-3.0-pro-image-preview", - "name": "Gemini 3.0 Pro Image Preview", - "display_name": "Gemini 3.0 Pro Image Preview", + "id": "microsoft/phi-4-mini-instruct", + "name": "Microsoft: Phi 4 Mini Instruct", + "display_name": "Microsoft: Phi 4 Mini Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2025-10-17", + "last_updated": "2026-05-07", + "cost": { + "input": 0.08, + "output": 0.35, + "cache_read": 0.08 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "gryphe/mythomax-l2-13b", + "name": "MythoMax 13B", + 
"display_name": "MythoMax 13B", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", + "cost": { + "input": 0.06, + "output": 0.06 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "claude-4.5-opus", - "name": "Claude 4.5 Opus", - "display_name": "Claude 4.5 Opus", + "id": "nex-agi/deepseek-v3.1-nex-n1", + "name": "Nex AGI: DeepSeek V3.1 Nex N1", + "display_name": "Nex AGI: DeepSeek V3.1 Nex N1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-25", + "release_date": "2025-01-01", "last_updated": "2025-11-25", + "cost": { + "input": 0.27, + "output": 1 + }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "upstage/solar-pro-3", + "name": "Upstage: Solar Pro 3", + "display_name": "Upstage: Solar Pro 3", "modalities": { "input": [ "text" @@ -52460,7 +53205,7 @@ }, "limit": { "context": 128000, 
- "output": 32000 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -52468,39 +53213,62 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-01-27", + "last_updated": "2026-03-15", + "cost": { + "input": 0.15, + "output": 0.6 + }, "type": "chat" }, { - "id": "claude-4.0-opus", - "name": "Claude 4.0 Opus", - "display_name": "Claude 4.0 Opus", + "id": "anthracite-org/magnum-v4-72b", + "name": "Magnum v4 72B", + "display_name": "Magnum v4 72B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16384, + "output": 2048 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-10-22", + "last_updated": "2026-03-15", + "cost": { + "input": 3, + "output": 5 + }, + "type": "chat" + }, + { + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek: DeepSeek V3.2 Exp", + "display_name": "DeepSeek: DeepSeek V3.2 Exp", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -52508,45 +53276,52 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-09-29", + "cost": { + "input": 0.27, + "output": 0.41 + }, "type": "chat" }, { - "id": "claude-4.5-haiku", - "name": "Claude 4.5 Haiku", - "display_name": "Claude 4.5 Haiku", + "id": "deepseek/deepseek-chat", 
+ "name": "DeepSeek: DeepSeek V3", + "display_name": "DeepSeek: DeepSeek V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", + "cost": { + "input": 0.32, + "output": 0.89, + "cache_read": 0.15 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-16", - "last_updated": "2025-10-16", "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek: R1", + "display_name": "DeepSeek: R1", "modalities": { "input": [ "text" @@ -52556,13 +53331,14 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 64000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -52576,30 +53352,30 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 0.7, + "output": 2.5 + }, "type": "chat" }, { - "id": "gemini-3.0-flash-preview", - "name": "Gemini 3.0 Flash Preview", - "display_name": "Gemini 3.0 Flash Preview", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek: DeepSeek V4 Pro", + "display_name": "DeepSeek: DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -52610,60 +53386,73 @@ 
"extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", + "cost": { + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 + }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "display_name": "Gemini 2.5 Flash Image", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek: R1 0528", + "display_name": "DeepSeek: R1 0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", - "type": "imageGeneration" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-05-28", + "last_updated": "2026-03-15", + "cost": { + "input": 0.45, + "output": 2.15, + "cache_read": 0.2 + }, + "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek: DeepSeek V3.2 Speciale", + "display_name": "DeepSeek: DeepSeek V3.2 Speciale", "modalities": { "input": [ "text" @@ -52673,37 +53462,41 @@ ] }, "limit": { - 
"context": 131072, - "output": 98304 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2026-03-15", + "cost": { + "input": 0.4, + "output": 1.2, + "cache_read": 0.135 + }, "type": "chat" }, { - "id": "claude-3.5-sonnet", - "name": "Claude 3.5 Sonnet", - "display_name": "Claude 3.5 Sonnet", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek: DeepSeek V3.2", + "display_name": "DeepSeek: DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8200 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -52711,45 +53504,58 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-09", - "last_updated": "2025-09-09", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2026-03-15", + "cost": { + "input": 0.26, + "output": 0.38, + "cache_read": 0.125 + }, "type": "chat" }, { - "id": "claude-4.0-sonnet", - "name": "Claude 4.0 Sonnet", - "display_name": "Claude 4.0 Sonnet", + "id": "deepseek/deepseek-v4-flash:free", + "name": "DeepSeek: DeepSeek V4 Flash (free)", + "display_name": "DeepSeek: DeepSeek V4 Flash (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 384000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": 
"2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-04-24", + "last_updated": "2026-05-16", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30b A3b Instruct 2507", - "display_name": "Qwen3 30b A3b Instruct 2507", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek: DeepSeek V4 Flash", + "display_name": "DeepSeek: DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -52759,37 +53565,52 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", + "cost": { + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 + }, "type": "chat" }, { - "id": "doubao-seed-1.6-thinking", - "name": "Doubao-Seed 1.6 Thinking", - "display_name": "Doubao-Seed 1.6 Thinking", + "id": "deepseek/deepseek-chat-v3-0324", + "name": "DeepSeek: DeepSeek V3 0324", + "display_name": "DeepSeek: DeepSeek V3 0324", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -52797,67 +53618,59 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-24", + "last_updated": "2026-03-15", + "cost": { + "input": 0.2, + "output": 0.77, + "cache_read": 0.095 + }, 
"type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek: R1 Distill Llama 70B", + "display_name": "DeepSeek: R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-23", + "last_updated": "2026-03-15", + "cost": { + "input": 0.7, + "output": 0.8, + "cache_read": 0.015 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "deepseek/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek: R1 Distill Qwen 32B", + "display_name": "DeepSeek: R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -52867,36 +53680,29 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - 
"open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-11-25", + "cost": { + "input": 0.29, + "output": 0.29 + }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "deepseek/deepseek-chat-v3.1", + "name": "DeepSeek: DeepSeek V3.1", + "display_name": "DeepSeek: DeepSeek V3.1", "modalities": { "input": [ "text" @@ -52906,8 +53712,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 7168 }, "temperature": true, "tool_call": true, @@ -52915,27 +53721,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.15, + "output": 0.75 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30b A3b Thinking 2507", - "display_name": "Qwen3 30b A3b Thinking 2507", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek: DeepSeek V3.1 Terminus", + "display_name": "DeepSeek: DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -52945,8 +53744,8 @@ ] }, "limit": { - "context": 126000, - "output": 32000 + "context": 163840, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -52954,55 +53753,53 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": 
"2026-02-04", - "last_updated": "2026-02-04", + "open_weights": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "cost": { + "input": 0.21, + "output": 0.79, + "cache_read": 0.13 + }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "perplexity/sonar", + "name": "Perplexity: Sonar", + "display_name": "Perplexity: Sonar", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4096 + "context": 127072, + "output": 25415 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 1, + "output": 1 + }, "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "perplexity/sonar-deep-research", + "name": "Perplexity: Sonar Deep Research", + "display_name": "Perplexity: Sonar Deep Research", "modalities": { "input": [ "text" @@ -53013,67 +53810,65 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 25600 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "cost": { + "input": 2, + "output": 8 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "perplexity/sonar-reasoning-pro", + "name": "Perplexity: Sonar Reasoning Pro", + "display_name": "Perplexity: Sonar Reasoning Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ 
"text" ] }, "limit": { - "context": 40000, - "output": 4096 + "context": 128000, + "output": 25600 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 2, + "output": 8 + }, "type": "chat" }, { - "id": "claude-4.1-opus", - "name": "Claude 4.1 Opus", - "display_name": "Claude 4.1 Opus", + "id": "perplexity/sonar-pro-search", + "name": "Perplexity: Sonar Pro Search", + "display_name": "Perplexity: Sonar Pro Search", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" @@ -53081,54 +53876,60 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "release_date": "2025-10-31", + "last_updated": "2026-03-15", + "cost": { + "input": 3, + "output": 15 + }, "type": "chat" }, { - "id": "doubao-seed-2.0-mini", - "name": "Doubao Seed 2.0 Mini", - "display_name": "Doubao Seed 2.0 Mini", + "id": "perplexity/sonar-pro", + "name": "Perplexity: Sonar Pro", + "display_name": "Perplexity: Sonar Pro", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, 
"open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 3, + "output": 15 + }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "ai21/jamba-large-1.7", + "name": "AI21: Jamba Large 1.7", + "display_name": "AI21: Jamba Large 1.7", "modalities": { "input": [ "text" @@ -53138,8 +53939,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -53148,58 +53949,61 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "release_date": "2025-08-09", + "last_updated": "2026-03-15", + "cost": { + "input": 2, + "output": 8 + }, "type": "chat" }, { - "id": "doubao-seed-1.6", - "name": "Doubao-Seed 1.6", - "display_name": "Doubao-Seed 1.6", + "id": "meta-llama/llama-3.1-70b-instruct", + "name": "Meta: Llama 3.1 70B Instruct", + "display_name": "Meta: Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-23", + "cost": { + "input": 0.4, + "output": 0.4 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", "type": "chat" }, { - "id": "qwen2.5-vl-7b-instruct", - "name": "Qwen 2.5 VL 7B Instruct", - "display_name": "Qwen 2.5 VL 7B Instruct", + "id": "meta-llama/llama-4-scout", + "name": "Meta: Llama 4 Scout", + "display_name": "Meta: Llama 4 Scout", "modalities": { "input": [ 
"text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 327680, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -53207,44 +54011,50 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.08, + "output": 0.3 + }, "type": "chat" }, { - "id": "kling-v2-6", - "name": "Kling-V2 6", - "display_name": "Kling-V2 6", + "id": "meta-llama/llama-3.2-1b-instruct", + "name": "Meta: Llama 3.2 1B Instruct", + "display_name": "Meta: Llama 3.2 1B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 99999999, - "output": 99999999 + "context": 60000, + "output": 12000 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-01-13", - "last_updated": "2026-01-13", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2026-01-27", + "cost": { + "input": 0.027, + "output": 0.2 + }, "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "meta-llama/llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "display_name": "Llama Guard 3 8B", "modalities": { "input": [ "text" @@ -53254,104 +54064,91 @@ ] }, "limit": { - "context": 1000000, - "output": 80000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2024-04-18", + "last_updated": "2026-02-04", + 
"cost": { + "input": 0.02, + "output": 0.06 + }, "type": "chat" }, { - "id": "gemini-3.0-pro-preview", - "name": "Gemini 3.0 Pro Preview", - "display_name": "Gemini 3.0 Pro Preview", + "id": "meta-llama/llama-3-70b-instruct", + "name": "Meta: Llama 3 70B Instruct", + "display_name": "Meta: Llama 3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "pdf", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8192, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.51, + "output": 0.74 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", "type": "chat" }, { - "id": "doubao-seed-2.0-lite", - "name": "Doubao Seed 2.0 Lite", - "display_name": "Doubao Seed 2.0 Lite", + "id": "meta-llama/llama-3.2-11b-vision-instruct", + "name": "Meta: Llama 3.2 11B Vision Instruct", + "display_name": "Meta: Llama 3.2 11B Vision Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "open_weights": true, + "release_date": "2024-09-25", + "last_updated": 
"2024-09-25", + "cost": { + "input": 0.049, + "output": 0.049 + }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "meta-llama/llama-3-8b-instruct", + "name": "Meta: Llama 3 8B Instruct", + "display_name": "Meta: Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -53361,8 +54158,8 @@ ] }, "limit": { - "context": 262000, - "output": 4096 + "context": 8192, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -53370,15 +54167,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-14", - "last_updated": "2025-08-14", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2025-04-03", + "cost": { + "input": 0.03, + "output": 0.04 + }, "type": "chat" }, { - "id": "claude-3.5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "meta-llama/llama-4-maverick", + "name": "Meta: Llama 4 Maverick", + "display_name": "Meta: Llama 4 Maverick", "modalities": { "input": [ "text", @@ -53389,8 +54190,8 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1048576, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -53398,15 +54199,19 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-12-24", + "cost": { + "input": 0.15, + "output": 0.6 + }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Meta: Llama 3.3 70B Instruct", + "display_name": "Meta: Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -53416,30 +54221,28 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": 
true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.32 + }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen-Turbo", - "display_name": "Qwen-Turbo", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Meta: Llama 3.2 3B Instruct", + "display_name": "Meta: Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -53449,38 +54252,31 @@ ] }, "limit": { - "context": 1000000, - "output": 4096 + "context": 80000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2026-03-15", + "cost": { + "input": 0.051, + "output": 0.34 + }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "meta-llama/llama-guard-4-12b", + "name": "Meta: Llama Guard 4 12B", + "display_name": "Meta: Llama Guard 4 12B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -53488,76 +54284,62 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 163840, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": 
true, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.18, + "output": 0.18 + }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Meta: Llama 3.1 8B Instruct", + "display_name": "Meta: Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.02, + "output": 0.05 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "arcee-ai/spotlight", + "name": "Arcee AI: Spotlight", + "display_name": "Arcee AI: Spotlight", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -53565,35 +54347,28 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 131072, + "output": 65537 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - 
"thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.18, + "output": 0.18 }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-06", - "last_updated": "2025-09-06", "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "arcee-ai/trinity-mini", + "name": "Arcee AI: Trinity Mini", + "display_name": "Arcee AI: Trinity Mini", "modalities": { "input": [ "text" @@ -53603,8 +54378,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -53612,79 +54387,82 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": true, + "release_date": "2025-12", + "last_updated": "2026-01-28", + "cost": { + "input": 0.045, + "output": 0.15 + }, "type": "chat" }, { - "id": "doubao-1.5-vision-pro", - "name": "Doubao 1.5 Vision Pro", - "display_name": "Doubao 1.5 Vision Pro", + "id": "arcee-ai/maestro-reasoning", + "name": "Arcee AI: Maestro Reasoning", + "display_name": "Arcee AI: Maestro Reasoning", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 131072, + "output": 32000 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.9, + "output": 3.3 + }, "type": "chat" }, { - "id": "claude-4.5-sonnet", - "name": "Claude 4.5 Sonnet", - "display_name": "Claude 4.5 
Sonnet", + "id": "arcee-ai/coder-large", + "name": "Arcee AI: Coder Large", + "display_name": "Arcee AI: Coder Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.5, + "output": 0.8 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "arcee-ai/virtuoso-large", + "name": "Arcee AI: Virtuoso Large", + "display_name": "Arcee AI: Virtuoso Large", "modalities": { "input": [ "text" @@ -53694,24 +54472,28 @@ ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 131072, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.75, + "output": 1.2 + }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "arcee-ai/trinity-large-thinking", + "name": "Arcee AI: Trinity Large Thinking", + "display_name": "Arcee AI: Trinity Large Thinking", "modalities": { "input": [ "text" @@ -53721,8 +54503,8 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -53730,41 +54512,63 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-11", + "cost": { + "input": 0.22, + "output": 0.85 + }, + "type": "chat" + }, + { + "id": "arcee-ai/trinity-large-preview", + "name": "Arcee AI: Trinity Large Preview", + "display_name": "Arcee AI: Trinity Large Preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-01-28", + "last_updated": "2026-05-01", + "cost": { + "input": 0.15, + "output": 0.45 + }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "kilo-auto/frontier", + "name": "Kilo Auto Frontier", + "display_name": "Kilo Auto Frontier", "modalities": { "input": [ - "text", "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -53774,14 +54578,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", + "cost": { + "input": 5, + "output": 25 + }, "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen2.5-Max-2025-01-25", - "display_name": "Qwen2.5-Max-2025-01-25", + "id": "kilo-auto/balanced", + "name": "Kilo Auto Balanced", + "display_name": "Kilo Auto Balanced", "modalities": { "input": [ "text" @@ -53791,36 +54599,40 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + 
"output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", + "cost": { + "input": 0.6, + "output": 3 + }, "type": "chat" }, { - "id": "doubao-seed-2.0-pro", - "name": "Doubao Seed 2.0 Pro", - "display_name": "Doubao Seed 2.0 Pro", + "id": "kilo-auto/small", + "name": "Kilo Auto Small", + "display_name": "Kilo Auto Small", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 400000, "output": 128000 }, "temperature": true, @@ -53831,14 +54643,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", + "cost": { + "input": 0.05, + "output": 0.4 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp-thinking", - "name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", - "display_name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", + "id": "kilo-auto/free", + "name": "Kilo Auto Free", + "display_name": "Kilo Auto Free", "modalities": { "input": [ "text" @@ -53848,25 +54664,29 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus-thinking", - "name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", - "display_name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", + "id": "essentialai/rnj-1-instruct", + 
"name": "EssentialAI: Rnj 1 Instruct", + "display_name": "EssentialAI: Rnj 1 Instruct", "modalities": { "input": [ "text" @@ -53876,25 +54696,60 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 32768, + "output": 6554 }, "temperature": true, - "tool_call": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-05", + "last_updated": "2026-03-15", + "cost": { + "input": 0.15, + "output": 0.15 + }, + "type": "chat" + }, + { + "id": "alibaba/tongyi-deepresearch-30b-a3b", + "name": "Tongyi DeepResearch 30B A3B", + "display_name": "Tongyi DeepResearch 30B A3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "release_date": "2025-09-18", + "last_updated": "2026-03-15", + "cost": { + "input": 0.09, + "output": 0.45 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek/DeepSeek-V3.2-Exp", - "display_name": "DeepSeek/DeepSeek-V3.2-Exp", + "id": "stepfun/step-3.5-flash", + "name": "StepFun: Step 3.5 Flash", + "display_name": "StepFun: Step 3.5 Flash", "modalities": { "input": [ "text" @@ -53904,24 +54759,30 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-251201", - 
"name": "Deepseek/DeepSeek-V3.2", - "display_name": "Deepseek/DeepSeek-V3.2", + "id": "stepfun/step-3.5-flash:free", + "name": "StepFun: Step 3.5 Flash (free)", + "display_name": "StepFun: Step 3.5 Flash (free)", "modalities": { "input": [ "text" @@ -53931,8 +54792,8 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -53942,25 +54803,31 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-08-26", + "last_updated": "2026-05-01", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "deepseek/deepseek-math-v2", - "name": "Deepseek/Deepseek-Math-V2", - "display_name": "Deepseek/Deepseek-Math-V2", + "id": "perceptron/perceptron-mk1", + "name": "Perceptron: Perceptron Mk1", + "display_name": "Perceptron: Perceptron Mk1", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": false, @@ -53968,21 +54835,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2026-05-12", + "last_updated": "2026-05-16", + "cost": { + "input": 0.15, + "output": 1.5 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek/DeepSeek-V3.1-Terminus", - "display_name": "DeepSeek/DeepSeek-V3.1-Terminus", + "id": "allenai/olmo-3-32b-think", + "name": "AllenAI: Olmo 3 32B Think", + "display_name": "AllenAI: Olmo 3 32B Think", "modalities": { "input": [ "text" @@ -53992,113 +54858,130 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 65536, + "output": 65536 }, "temperature": true, - 
"tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": true, + "release_date": "2025-11-22", + "last_updated": "2026-03-15", + "cost": { + "input": 0.15, + "output": 0.5 + }, "type": "chat" }, { - "id": "stepfun-ai/gelab-zero-4b-preview", - "name": "Stepfun-Ai/Gelab Zero 4b Preview", - "display_name": "Stepfun-Ai/Gelab Zero 4b Preview", + "id": "rekaai/reka-flash-3", + "name": "Reka Flash 3", + "display_name": "Reka Flash 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 65536, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2026-04-11", + "cost": { + "input": 0.1, + "output": 0.2 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", "type": "chat" }, { - "id": "stepfun/step-3.5-flash", - "name": "Stepfun/Step-3.5 Flash", - "display_name": "Stepfun/Step-3.5 Flash", + "id": "rekaai/reka-edge", + "name": "Reka Edge", + "display_name": "Reka Edge", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 4096 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "open_weights": true, + "release_date": "2026-03-20", + "last_updated": "2026-04-11", + "cost": { + "input": 0.1, + "output": 0.1 + }, "type": "chat" }, { - "id": "x-ai/grok-4-fast", 
- "name": "x-AI/Grok-4-Fast", - "display_name": "x-AI/Grok-4-Fast", + "id": "baidu/qianfan-ocr-fast", + "name": "Baidu: Qianfan-OCR-Fast", + "display_name": "Baidu: Qianfan-OCR-Fast", "modalities": { "input": [ - "text", "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 65536, + "output": 28672 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-09-20", - "last_updated": "2025-09-20", + "release_date": "2026-04-20", + "last_updated": "2026-05-16", + "cost": { + "input": 0.68, + "output": 2.81 + }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "x-AI/Grok-Code-Fast 1", - "display_name": "x-AI/Grok-Code-Fast 1", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "Baidu: ERNIE 4.5 VL 424B A47B ", + "display_name": "Baidu: ERNIE 4.5 VL 424B A47B ", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -54106,97 +54989,91 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 123000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": true, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2026-01", + "cost": { + "input": 0.42, + "output": 1.25 }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-02", - "last_updated": "2025-09-02", "type": "chat" }, { - "id": "x-ai/grok-4-fast-reasoning", - "name": "X-Ai/Grok-4-Fast-Reasoning", - "display_name": "X-Ai/Grok-4-Fast-Reasoning", + "id": "baidu/ernie-4.5-21b-a3b", + "name": "Baidu: ERNIE 4.5 21B A3B", + "display_name": "Baidu: ERNIE 4.5 21B A3B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, 
"limit": { - "context": 2000000, - "output": 2000000 + "context": 120000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "cost": { + "input": 0.07, + "output": 0.28 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-non-reasoning", - "name": "X-Ai/Grok 4.1 Fast Non Reasoning", - "display_name": "X-Ai/Grok 4.1 Fast Non Reasoning", + "id": "baidu/ernie-4.5-300b-a47b", + "name": "Baidu: ERNIE 4.5 300B A47B ", + "display_name": "Baidu: ERNIE 4.5 300B A47B ", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 123000, + "output": 12000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2026-01", + "cost": { + "input": 0.28, + "output": 1.1 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "x-AI/Grok-4.1-Fast", - "display_name": "x-AI/Grok-4.1-Fast", + "id": "baidu/ernie-4.5-21b-a3b-thinking", + "name": "Baidu: ERNIE 4.5 21B A3B Thinking", + "display_name": "Baidu: ERNIE 4.5 21B A3B Thinking", "modalities": { "input": [ "text" @@ -54206,70 +55083,73 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, 
"attachment": false, - "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "open_weights": true, + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "cost": { + "input": 0.07, + "output": 0.28 + }, "type": "chat" }, { - "id": "x-ai/grok-4-fast-non-reasoning", - "name": "X-Ai/Grok-4-Fast-Non-Reasoning", - "display_name": "X-Ai/Grok-4-Fast-Non-Reasoning", + "id": "baidu/cobuddy:free", + "name": "Baidu: CoBuddy (free)", + "display_name": "Baidu: CoBuddy (free)", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 131072, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "release_date": "2026-05-06", + "last_updated": "2026-05-07", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-reasoning", - "name": "X-Ai/Grok 4.1 Fast Reasoning", - "display_name": "X-Ai/Grok 4.1 Fast Reasoning", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "Baidu: ERNIE 4.5 VL 28B A3B", + "display_name": "Baidu: ERNIE 4.5 VL 28B A3B", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 20000000, - "output": 2000000 + "context": 30000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -54278,66 +55158,51 @@ "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "cost": { + "input": 0.14, + "output": 0.56 + }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "OpenAI/GPT-5.2", - "display_name": "OpenAI/GPT-5.2", + 
"id": "poolside/laguna-xs.2:free", + "name": "Poolside: Laguna XS.2 (free)", + "display_name": "Poolside: Laguna XS.2 (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-04-28", + "last_updated": "2026-05-01", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "OpenAI/GPT-5", - "display_name": "OpenAI/GPT-5", + "id": "poolside/laguna-m.1:free", + "name": "Poolside: Laguna M.1 (free)", + "display_name": "Poolside: Laguna M.1 (free)", "modalities": { "input": [ "text" @@ -54347,8 +55212,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -54356,48 +55221,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2026-04-28", + "last_updated": "2026-05-01", + "cost": { + "input": 0, + 
"output": 0 + }, "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "Z-Ai/GLM 4.7", - "display_name": "Z-Ai/GLM 4.7", + "id": "xiaomi/mimo-v2-omni", + "name": "Xiaomi: MiMo-V2-Omni", + "display_name": "Xiaomi: MiMo-V2-Omni", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -54405,27 +55257,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.4, + "output": 2, + "cache_read": 0.08 + }, "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "Z-Ai/GLM 5", - "display_name": "Z-Ai/GLM 5", + "id": "xiaomi/mimo-v2.5-pro", + "name": "Xiaomi: MiMo V2.5 Pro", + "display_name": "Xiaomi: MiMo V2.5 Pro", "modalities": { "input": [ "text" @@ -54435,8 +55282,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -54456,43 +55303,71 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] + }, "type": "chat" }, { - "id": 
"z-ai/autoglm-phone-9b", - "name": "Z-Ai/Autoglm Phone 9b", - "display_name": "Z-Ai/Autoglm Phone 9b", + "id": "xiaomi/mimo-v2-flash", + "name": "Xiaomi: MiMo-V2-Flash", + "display_name": "Xiaomi: MiMo-V2-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 12800, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", + "cost": { + "input": 0.09, + "output": 0.29, + "cache_read": 0.045 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "Z-AI/GLM 4.6", - "display_name": "Z-AI/GLM 4.6", + "id": "xiaomi/mimo-v2-pro", + "name": "Xiaomi: MiMo-V2-Pro", + "display_name": "Xiaomi: MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -54502,40 +55377,61 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-10-11", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] + }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "Minimax/Minimax-M2", - "display_name": "Minimax/Minimax-M2", + "id": 
"xiaomi/mimo-v2.5", + "name": "Xiaomi: MiMo-V2.5", + "display_name": "Xiaomi: MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -54545,19 +55441,56 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + }, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ] + }, "type": "chat" - }, + } + ] + }, + "lmstudio": { + "id": "lmstudio", + "name": "LMStudio", + "display_name": "LMStudio", + "api": "http://127.0.0.1:1234/v1", + "doc": "https://lmstudio.ai/models", + "models": [ { - "id": "minimax/minimax-m2.1", - "name": "Minimax/Minimax-M2.1", - "display_name": "Minimax/Minimax-M2.1", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -54567,8 +55500,8 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -54582,15 +55515,19 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": 
"minimax/minimax-m2.5", - "name": "Minimax/Minimax-M2.5", - "display_name": "Minimax/Minimax-M2.5", + "id": "qwen/qwen3-coder-30b", + "name": "Qwen3 Coder 30B", + "display_name": "Qwen3 Coder 30B", "modalities": { "input": [ "text" @@ -54600,30 +55537,29 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "Minimax/Minimax-M2.5 Highspeed", - "display_name": "Minimax/Minimax-M2.5 Highspeed", + "id": "qwen/qwen3-30b-a3b-2507", + "name": "Qwen3 30B A3B 2507", + "display_name": "Qwen3 30B A3B 2507", "modalities": { "input": [ "text" @@ -54633,48 +55569,89 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + } + ] + }, + "xiaomi-token-plan-cn": { + "id": "xiaomi-token-plan-cn", + "name": "Xiaomi Token Plan (China)", + "display_name": "Xiaomi Token Plan (China)", + "api": "https://token-plan-cn.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ + { + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", + "modalities": 
{ + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 8192, + "output": 16384 + }, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Moonshotai/Kimi-K2.5", - "display_name": "Moonshotai/Kimi-K2.5", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -54689,14 +55666,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -54706,24 +55689,42 @@ ] }, "limit": { - "context": 256000, - "output": 100000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, 
- "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -54733,13 +55734,14 @@ ] }, "limit": { - "context": 256000, - "output": 100000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -54753,15 +55755,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "meituan/longcat-flash-chat", - "name": "Meituan/Longcat-Flash-Chat", - "display_name": "Meituan/Longcat-Flash-Chat", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -54771,62 +55779,110 @@ ] }, "limit": { - "context": 131072, + "context": 1048576, "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-11-05", - "last_updated": "2025-11-05", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { 
+ "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "meituan/longcat-flash-lite", - "name": "Meituan/Longcat-Flash-Lite", - "display_name": "Meituan/Longcat-Flash-Lite", - "modalities": { - "input": [ - "text" + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 320000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 }, - "attachment": false, - "open_weights": false, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", "type": "chat" - }, + } + ] + }, + "v0": { + "id": "v0", + "name": "v0", + "display_name": "v0", + "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", + "models": [ { - "id": "mimo-v2-flash", - "name": "Mimo-V2-Flash", - "display_name": "Mimo-V2-Flash", + "id": "v0-1.5-md", + "name": "v0-1.5-md", + "display_name": "v0-1.5-md", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -54834,33 +55890,32 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", 
"cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "Xiaomi/Mimo-V2-Flash", - "display_name": "Xiaomi/Mimo-V2-Flash", + "id": "v0-1.5-lg", + "name": "v0-1.5-lg", + "display_name": "v0-1.5-lg", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 512000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -54868,64 +55923,62 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 15, + "output": 75 }, "type": "chat" - } - ] - }, - "kilo": { - "id": "kilo", - "name": "Kilo Gateway", - "display_name": "Kilo Gateway", - "api": "https://api.kilo.ai/api/gateway", - "doc": "https://kilo.ai", - "models": [ + }, { - "id": "rekaai/reka-edge", - "name": "Reka Edge", - "display_name": "Reka Edge", + "id": "v0-1.0-md", + "name": "v0-1.0-md", + "display_name": "v0-1.0-md", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-20", - "last_updated": "2026-04-11", + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.1, - "output": 0.1 + "input": 3, + "output": 15 }, "type": "chat" - }, + } + ] + }, + "morph": { + "id": "morph", + "name": "Morph", + "display_name": "Morph", + "api": 
"https://api.morphllm.com/v1", + "doc": "https://docs.morphllm.com/api-reference/introduction", + "models": [ { - "id": "rekaai/reka-flash-3", - "name": "Reka Flash 3", - "display_name": "Reka Flash 3", + "id": "morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ "text" @@ -54935,29 +55988,28 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 32000, + "output": 32000 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2026-04-11", + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.1, - "output": 0.2 + "input": 0.9, + "output": 1.9 }, "type": "chat" }, { - "id": "ai21/jamba-large-1.7", - "name": "AI21: Jamba Large 1.7", - "display_name": "AI21: Jamba Large 1.7", + "id": "auto", + "name": "Auto", + "display_name": "Auto", "modalities": { "input": [ "text" @@ -54967,28 +56019,28 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-09", - "last_updated": "2026-03-15", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 2, - "output": 8 + "input": 0.85, + "output": 1.55 }, "type": "chat" }, { - "id": "alibaba/tongyi-deepresearch-30b-a3b", - "name": "Tongyi DeepResearch 30B A3B", - "display_name": "Tongyi DeepResearch 30B A3B", + "id": "morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", "modalities": { "input": [ "text" @@ -54998,60 +56050,68 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 16000, + "output": 16000 }, - 
"temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2026-03-15", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.09, - "output": 0.45 + "input": 0.8, + "output": 1.2 }, "type": "chat" - }, + } + ] + }, + "nearai": { + "id": "nearai", + "name": "NEAR AI Cloud", + "display_name": "NEAR AI Cloud", + "api": "https://cloud-api.near.ai/v1", + "doc": "https://docs.near.ai/", + "models": [ { - "id": "inflection/inflection-3-pi", - "name": "Inflection: Inflection 3 Pi", - "display_name": "Inflection: Inflection 3 Pi", + "id": "openai/whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 448, + "output": 448 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 2.5, - "output": 10 + "input": 0.01, + "output": 0 }, "type": "chat" }, { - "id": "inflection/inflection-3-productivity", - "name": "Inflection: Inflection 3 Productivity", - "display_name": "Inflection: Inflection 3 Productivity", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text" @@ -55061,28 +56121,34 @@ ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 131000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + 
"reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2.5, - "output": 10 + "input": 0.15, + "output": 0.55 }, "type": "chat" }, { - "id": "liquid/lfm-2-24b-a2b", - "name": "LiquidAI: LFM2-24B-A2B", - "display_name": "LiquidAI: LFM2-24B-A2B", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1 FP8", + "display_name": "GLM-5.1 FP8", "modalities": { "input": [ "text" @@ -55092,39 +56158,52 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 202752, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.03, - "output": 0.12 + "input": 0.85, + "output": 3.3 }, "type": "chat" }, { - "id": "writer/palmyra-x5", - "name": "Writer: Palmyra X5", - "display_name": "Writer: Palmyra X5", + "id": "black-forest-labs/FLUX.2-klein-4B", + "name": "FLUX.2 Klein 4B", + "display_name": "FLUX.2 Klein 4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1040000, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": false, @@ -55132,19 +56211,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": true, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - 
"input": 0.6, - "output": 6 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "ibm-granite/granite-4.1-8b", - "name": "IBM: Granite 4.1 8B", - "display_name": "IBM: Granite 4.1 8B", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B-A3B Instruct 2507", + "display_name": "Qwen3 30B-A3B Instruct 2507", "modalities": { "input": [ "text" @@ -55154,8 +56233,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -55163,20 +56242,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-05-01", + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.05, - "output": 0.1, - "cache_read": 0.05 + "input": 0.15, + "output": 0.55 }, "type": "chat" }, { - "id": "ibm-granite/granite-4.0-h-micro", - "name": "IBM: Granite 4.0 Micro", - "display_name": "IBM: Granite 4.0 Micro", + "id": "Qwen/Qwen3-Embedding-0.6B", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ "text" @@ -55186,28 +56264,28 @@ ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 40960, + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2026-03-15", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { - "input": 0.017, - "output": 0.11 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "essentialai/rnj-1-instruct", - "name": "EssentialAI: Rnj 1 Instruct", - "display_name": "EssentialAI: Rnj 1 Instruct", + "id": "Qwen/Qwen3-Reranker-0.6B", + "name": "Qwen3 Reranker 0.6B", + "display_name": "Qwen3 Reranker 0.6B", "modalities": { "input": [ "text" @@ -55217,28 +56295,28 @@ ] }, "limit": { - 
"context": 32768, - "output": 6554 + "context": 40960, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-05", - "last_updated": "2026-03-15", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.01, + "output": 0.01 }, - "type": "chat" + "type": "rerank" }, { - "id": "perplexity/sonar-pro", - "name": "Perplexity: Sonar Pro", - "display_name": "Perplexity: Sonar Pro", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen3-VL 30B-A3B Instruct", + "display_name": "Qwen3-VL 30B-A3B Instruct", "modalities": { "input": [ "text", @@ -55249,60 +56327,85 @@ ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 256000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 3, - "output": 15 + "input": 0.15, + "output": 0.55 }, "type": "chat" }, { - "id": "perplexity/sonar-deep-research", - "name": "Perplexity: Sonar Deep Research", - "display_name": "Perplexity: Sonar Deep Research", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 25600 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + 
"effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 2, - "output": 8 + "input": 1.8, + "output": 15.5, + "cache_read": 0.18 }, "type": "chat" }, { - "id": "perplexity/sonar", - "name": "Perplexity: Sonar", - "display_name": "Perplexity: Sonar", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", @@ -55313,354 +56416,536 @@ ] }, "limit": { - "context": 127072, - "output": 25415 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 1, - "output": 1 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "perplexity/sonar-pro-search", - "name": "Perplexity: Sonar Pro Search", - "display_name": "Perplexity: Sonar Pro Search", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 
200000, - "output": 8000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-10-31", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 3, - "output": 15 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Perplexity: Sonar Reasoning Pro", - "display_name": "Perplexity: Sonar Reasoning Pro", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 25600 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2, - "output": 8 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3.1", - "name": "DeepSeek: DeepSeek V3.1", - "display_name": "DeepSeek: DeepSeek V3.1", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 7168 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-21", - "last_updated": 
"2025-08-21", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.15, - "output": 0.75 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek: DeepSeek V3", - "display_name": "DeepSeek: DeepSeek V3", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.32, - "output": 0.89, - "cache_read": 0.15 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek: R1 Distill Llama 70B", - "display_name": "DeepSeek: R1 Distill Llama 70B", + "id": 
"openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-23", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.7, - "output": 0.8, - "cache_read": 0.015 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek: R1", - "display_name": "DeepSeek: R1", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - 
"continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.7, - "output": 2.5 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-speciale", - "name": "DeepSeek: DeepSeek V3.2 Speciale", - "display_name": "DeepSeek: DeepSeek V3.2 Speciale", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.4, - "output": 1.2, - "cache_read": 0.135 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + 
}, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-32b", - "name": "DeepSeek: R1 Distill Qwen 32B", - "display_name": "DeepSeek: R1 Distill Qwen 32B", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 1047576, "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.29, - "output": 0.29 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek: DeepSeek V3.2 Exp", - "display_name": "DeepSeek: DeepSeek V3.2 Exp", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-09-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + 
"last_updated": "2025-04-16", "cost": { - "input": 0.27, - "output": 0.41 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek: DeepSeek V4 Flash", - "display_name": "DeepSeek: DeepSeek V4 Flash", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -55669,29 +56954,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek: DeepSeek V4 Pro", - "display_name": "DeepSeek: DeepSeek V4 Pro", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -55701,10 +56997,10 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -55713,42 +57009,48 @@ "extra_capabilities": { "reasoning": { 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek: DeepSeek V3.2", - "display_name": "DeepSeek: DeepSeek V3.2", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -55756,68 +57058,103 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.26, - "output": 0.38, - "cache_read": 0.125 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3-0324", - "name": "DeepSeek: DeepSeek V3 0324", - "display_name": "DeepSeek: DeepSeek V3 0324", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + 
"image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.2, - "output": 0.77, - "cache_read": 0.095 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek: R1 0528", - "display_name": "DeepSeek: R1 0528", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -55827,41 +57164,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-28", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.45, - "output": 2.15, - "cache_read": 0.2 + "input": 1, + "output": 5, + 
"cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek: DeepSeek V3.1 Terminus", - "display_name": "DeepSeek: DeepSeek V3.1 Terminus", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -55869,163 +57204,274 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.21, - "output": 0.79, - "cache_read": 0.13 + "input": 3, + "output": 15.5, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openrouter/auto", - "name": "Auto Router", - "display_name": "Auto Router", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ - "image", "text" ] }, "limit": { - "context": 2000000, - "output": 32768 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openrouter/bodybuilder", - "name": "Body Builder (beta)", - "display_name": "Body Builder (beta)", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openrouter/owl-alpha", - "name": "Owl Alpha", - "display_name": "Owl Alpha", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 262144 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-04-30", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openrouter/pareto-code", - "name": "Pareto Code Router", - "display_name": "Pareto Code Router", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1048576, "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "openrouter/free", - "name": "Free Models Router", - "display_name": "Free Models Router", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ + "text", "image", - "text" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -56033,83 +57479,174 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + 
"default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-02-01", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "inclusionai/ling-2.6-1t:free", - "name": "inclusionAI: Ling-2.6-1T (free)", - "display_name": "inclusionAI: Ling-2.6-1T (free)", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": 
"inclusionai/ling-2.6-flash", - "name": "inclusionAI: Ling-2.6 Flash", - "display_name": "inclusionAI: Ling-2.6 Flash", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.016 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Arcee AI: Trinity Mini", - "display_name": "Arcee AI: Trinity Mini", + "id": "Qwen/Qwen3.5-122B-A10B", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text" @@ -56120,7 +57657,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -56128,54 +57665,79 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-12", - 
"last_updated": "2026-01-28", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.045, - "output": 0.15 + "input": 0.4, + "output": 3.2 }, "type": "chat" - }, + } + ] + }, + "abacus": { + "id": "abacus", + "name": "Abacus", + "display_name": "Abacus", + "api": "https://routellm.abacus.ai/v1", + "doc": "https://abacus.ai/help/api", + "models": [ { - "id": "arcee-ai/virtuoso-large", - "name": "Arcee AI: Virtuoso Large", - "display_name": "Arcee AI: Virtuoso Large", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 64000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.75, - "output": 1.2 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-thinking", - "name": "Arcee AI: Trinity Large Thinking", - "display_name": "Arcee AI: Trinity Large Thinking", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -56183,7 +57745,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -56191,287 +57753,395 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-04-01", - 
"last_updated": "2026-04-11", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.22, - "output": 0.85 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "arcee-ai/spotlight", - "name": "Arcee AI: Spotlight", - "display_name": "Arcee AI: Spotlight", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65537 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.18, - "output": 0.18 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "arcee-ai/maestro-reasoning", - "name": "Arcee AI: Maestro Reasoning", - "display_name": "Arcee AI: Maestro Reasoning", + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": 
"2025-05-06", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 0.9, - "output": 3.3 + "input": 20, + "output": 40 }, "type": "chat" }, { - "id": "arcee-ai/coder-large", - "name": "Arcee AI: Coder Large", - "display_name": "Arcee AI: Coder Large", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.5, - "output": 0.8 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-preview", - "name": "Arcee AI: Trinity Large Preview", - "display_name": "Arcee AI: Trinity Large Preview", + "id": "route-llm", + "name": "Route LLM", + "display_name": "Route LLM", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-05-01", + "knowledge": 
"2024-10", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.15, - "output": 0.45 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "deepcogito/cogito-v2.1-671b", - "name": "Deep Cogito: Cogito v2.1 671B", - "display_name": "Deep Cogito: Cogito v2.1 671B", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-14", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { "input": 1.25, - "output": 1.25 + "output": 10 }, "type": "chat" }, { - "id": "upstage/solar-pro-3", - "name": "Upstage: Solar Pro 3", - "display_name": "Upstage: Solar Pro 3", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 2000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - 
"last_updated": "2026-03-15", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "nex-agi/deepseek-v3.1-nex-n1", - "name": "Nex AGI: DeepSeek V3.1 Nex N1", - "display_name": "Nex AGI: DeepSeek V3.1 Nex N1", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 163840 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.27, - "output": 1 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "bytedance-seed/seed-1.6", - "name": "ByteDance Seed: Seed 1.6", - "display_name": "ByteDance Seed: Seed 1.6", + "id": "gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-09", - 
"last_updated": "2025-09", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.25, - "output": 2 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "bytedance-seed/seed-2.0-lite", - "name": "ByteDance Seed: Seed-2.0-Lite", - "display_name": "ByteDance Seed: Seed-2.0-Lite", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -56479,33 +58149,43 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-10", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.25, - "output": 2 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "bytedance-seed/seed-1.6-flash", - "name": "ByteDance Seed: Seed 1.6 Flash", - "display_name": "ByteDance Seed: Seed 1.6 Flash", + "id": "grok-4-0709", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -56514,84 +58194,86 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.075, - "output": 0.3 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": 
"bytedance-seed/seed-2.0-mini", - "name": "ByteDance Seed: Seed-2.0-Mini", - "display_name": "ByteDance Seed: Seed-2.0-Mini", + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat Latest", + "display_name": "GPT-5.1 Chat Latest", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-27", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "mancer/weaver", - "name": "Mancer: Weaver (alpha)", - "display_name": "Mancer: Weaver (alpha)", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-08-02", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.75, - "output": 1 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "anthracite-org/magnum-v4-72b", - "name": "Magnum v4 72B", - "display_name": "Magnum v4 72B", + "id": "llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "display_name": "Llama 3.3 70B Versatile", "modalities": { "input": [ "text" @@ -56601,73 +58283,335 @@ ] }, "limit": { - "context": 16384, - "output": 2048 + "context": 128000, + "output": 32768 }, 
"temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-10-22", - "last_updated": "2026-03-15", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 3, - "output": 5 + "input": 0.59, + "output": 0.79 }, "type": "chat" }, { - "id": "kilo-auto/balanced", - "name": "Kilo Auto Balanced", - "display_name": "Kilo Auto Balanced", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "cost": { + "input": 3, + "output": 15 + }, + "type": "chat" + }, + { + "id": "gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6 + }, + "type": "chat" + }, + { + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 3 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "kilo-auto/frontier", - "name": "Kilo Auto Frontier", - "display_name": "Kilo Auto Frontier", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "image", + "text", + "image" + ], + 
"output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1050000, "output": 128000 }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15 + }, + "type": "chat" + }, + { + "id": "gpt-4o-mini", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + 
"release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, "temperature": true, "tool_call": true, "reasoning": { @@ -56676,8 +58620,9 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { "input": 5, "output": 25 @@ -56685,13 +58630,14 @@ "type": "chat" }, { - "id": "kilo-auto/small", - "name": "Kilo Auto Small", - "display_name": "Kilo Auto Small", + "id": "gpt-5.3-codex-xhigh", + "name": "GPT-5.3 Codex XHigh", + "display_name": "GPT-5.3 Codex XHigh", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" @@ -56701,37 +58647,95 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.05, - "output": 0.4 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "kilo-auto/free", - "name": "Kilo Auto Free", - "display_name": "Kilo Auto Free", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + 
"display_name": "Claude Opus 4", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-14", + "last_updated": "2025-05-14", + "cost": { + "input": 15, + "output": 75 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -56739,20 +58743,21 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "undi95/remm-slerp-l2-13b", - "name": "ReMM SLERP 13B", - "display_name": "ReMM SLERP 13B", + "id": "qwen-2.5-coder-32b", + "name": "Qwen 2.5 Coder 32B", + "display_name": "Qwen 2.5 Coder 32B", "modalities": { "input": [ "text" @@ -56762,249 +58767,608 @@ ] }, "limit": { - "context": 6144, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-07-22", - "last_updated": "2026-03-15", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "cost": { - "input": 0.45, - "output": 0.65 + "input": 0.79, + "output": 0.79 }, "type": "chat" }, { - "id": "allenai/olmo-3-32b-think", - "name": "AllenAI: Olmo 3 32B Think", - "display_name": 
"AllenAI: Olmo 3 32B Think", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, + "context": 1048576, "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-22", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.15, - "output": 0.5 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "cache_write": 1 }, "type": "chat" }, { - "id": "nousresearch/hermes-2-pro-llama-3-8b", - "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", - "display_name": "NousResearch: Hermes 2 Pro - Llama-3 8B", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-05-27", - "last_updated": "2024-06-27", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + 
"release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.14, - "output": 0.14 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "nousresearch/hermes-4-405b", - "name": "Nous: Hermes 4 405B", - "display_name": "Nous: Hermes 4 405B", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10 + }, + "type": "chat" + }, + { + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + 
"attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1, + "input": 0.5, "output": 3 }, "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-70b", - "name": "Nous: Hermes 3 70B Instruct", - "display_name": "Nous: Hermes 3 70B Instruct", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat Latest", + "display_name": "GPT-5.2 Chat Latest", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", + "cost": { + "input": 1.75, + "output": 14 + }, + "type": "chat" + }, + { + "id": "gpt-4.1-nano", + "name": "GPT-4.1 Nano", + "display_name": "GPT-4.1 Nano", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1047576, "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-18", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "nousresearch/hermes-4-70b", - "name": "Nous: Hermes 4 70B", - "display_name": "Nous: Hermes 4 70B", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + 
"temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.13, - "output": 0.4, - "cache_read": 0.055 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-405b", - "name": "Nous: Hermes 3 405B Instruct", - "display_name": "Nous: Hermes 3 405B Instruct", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10 + }, + "type": "chat" + }, + { + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", + "modalities": { + "input": [ + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, - "tool_call": 
false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-16", - "last_updated": "2024-08-16", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 1, - "output": 1 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "morph/morph-v3-fast", - "name": "Morph: Morph V3 Fast", - "display_name": "Morph: Morph V3 Fast", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14 + }, + "type": "chat" + }, + { + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 81920, - "output": 38000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + 
"min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "morph/morph-v3-large", - "name": "Morph: Morph V3 Large", - "display_name": "Morph: Morph V3 Large", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2 + }, + "type": "chat" + }, + { + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -57014,28 +59378,6042 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + 
"effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.9, - "output": 1.9 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "stepfun/step-3.5-flash:free", - "name": "StepFun: Step 3.5 Flash (free)", - "display_name": "StepFun: Step 3.5 Flash (free)", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 1.75, + "output": 14 + }, + "type": "chat" + }, + { + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + 
"interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 5, + "output": 25 + }, + "type": "chat" + }, + { + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15 + }, + "type": "chat" + }, + { + "id": "o3", + "name": "o3", + "display_name": "o3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": 
"2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 2, + "output": 8 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-14", + "last_updated": "2025-05-14", + "cost": { + "input": 3, + "output": 15 + }, + "type": "chat" + }, + { + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "cost": { + "input": 0.2, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo Preview", + "display_name": "Kimi K2 Turbo Preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", + "cost": { + "input": 0.15, + "output": 8 + }, + "type": "chat" + }, + { + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + 
"tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10 + }, + "type": "chat" + }, + { + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat Latest", + "display_name": "GPT-5.3 Chat Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", + "cost": { + "input": 1.75, + "output": 14 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 3, + "output": 7 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", + 
"modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", + "cost": { + "input": 0.27, + "output": 1 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-15", + "last_updated": "2025-06-15", + "cost": { + "input": 0.27, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.08, + "output": 0.44 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + 
"attachment": false, + "open_weights": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", + "cost": { + "input": 0.6, + "output": 2.2 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.6, + "output": 2.2 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", + "cost": { + "input": 0.6, + "output": 2.2 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 1, + 
"output": 3.2 + }, + "type": "chat" + }, + { + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 0.55, + "output": 1.66 + }, + "type": "chat" + }, + { + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.02, + "output": 0.05 + }, + "type": "chat" + }, + { + "id": "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", + "name": "Llama 3.1 405B Instruct Turbo", + "display_name": "Llama 3.1 405B Instruct Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 3.5, + "output": 3.5 + }, + "type": "chat" + }, + { + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 32768 + }, + "temperature": 
true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.14, + "output": 0.59 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-32B", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "cost": { + "input": 0.09, + "output": 0.29 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct", + "display_name": "Qwen3 235B A22B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "cost": { + "input": 0.13, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "Qwen/QwQ-32B", + "name": "QwQ 32B", + "display_name": "QwQ 32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ 
+ "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-11-28", + "last_updated": "2024-11-28", + "cost": { + "input": 0.4, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "Qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-07-22", + "last_updated": "2025-07-22", + "cost": { + "input": 0.29, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-09-19", + "last_updated": "2024-09-19", + "cost": { + "input": 0.11, + "output": 0.38 + }, + "type": "chat" + } + ] + }, + "privatemode-ai": { + "id": "privatemode-ai", + "name": "Privatemode AI", + "display_name": "Privatemode AI", + "api": "http://localhost:8080/v1", + "doc": "https://docs.privatemode.ai/api/overview", + "models": [ + { + "id": "gemma-3-27b", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", + "cost": { + 
"input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "whisper-large-v3", + "name": "Whisper large-v3", + "display_name": "Whisper large-v3", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2023-09-01", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "qwen3-embedding-4b", + "name": "Qwen3-Embedding 4B", + "display_name": "Qwen3-Embedding 4B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 2560 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-06-06", + "last_updated": "2025-06-06", + "cost": { + "input": 0, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "qwen3-coder-30b-a3b", + "name": "Qwen3-Coder 30B-A3B", + "display_name": "Qwen3-Coder 30B-A3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + 
"reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + } + ] + }, + "minimax-cn-coding-plan": { + "id": "minimax-cn-coding-plan", + "name": "MiniMax Token Plan (minimaxi.com)", + "display_name": "MiniMax Token Plan (minimaxi.com)", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/token-plan/intro", + "models": [ + { + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", + "modalities": { + "input": [ + "text" + ], + 
"output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", + "modalities": { + 
"input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + } + ] + }, + "xiaomi-token-plan-ams": { + "id": "xiaomi-token-plan-ams", + "name": "Xiaomi Token Plan (Europe)", + "display_name": "Xiaomi Token Plan (Europe)", + "api": "https://token-plan-ams.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ + { + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 8192, + "output": 16384 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "mimo-v2-pro", + 
"name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + 
"open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + } + ] + }, + "cloudferro-sherlock": { + "id": "cloudferro-sherlock", + "name": "CloudFerro Sherlock", + "display_name": "CloudFerro Sherlock", + "api": "https://api-sherlock.cloudferro.com/openai/v1/", + "doc": "https://docs.sherlock.cloudferro.com/", + "models": [ + { + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "cost": { + "input": 2.92, + "output": 2.92 + }, + "type": "chat" + }, + { + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", + "modalities": { + 
"input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 70000, + "output": 70000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10-09", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 2.92, + "output": 2.92 + }, + "type": "chat" + }, + { + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196000, + "output": 16000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "speakleash/Bielik-11B-v2.6-Instruct", + "name": "Bielik 11B v2.6 Instruct", + "display_name": "Bielik 11B v2.6 Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "cost": { + "input": 0.67, + "output": 0.67 + }, + "type": "chat" + }, + { + "id": "speakleash/Bielik-11B-v3.0-Instruct", + "name": "Bielik 11B v3.0 Instruct", + "display_name": "Bielik 11B v3.0 Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + 
"knowledge": "2025-03", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "cost": { + "input": 0.67, + "output": 0.67 + }, + "type": "chat" + } + ] + }, + "openai": { + "id": "openai", + "name": "OpenAI", + "display_name": "OpenAI", + "doc": "https://platform.openai.com/docs/models", + "models": [ + { + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8191, + "output": 3072 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.13, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "gpt-image-1-mini", + "name": "gpt-image-1-mini", + "display_name": "gpt-image-1-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-26", + "last_updated": "2025-09-26", + "type": "imageGeneration" + }, + { + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", + "modalities": { + "input": [ + 
"text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16385, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": 
"2025-06-10", + "cost": { + "input": 20, + "output": 80 + }, + "type": "chat" + }, + { + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + }, + "type": "chat" + }, + { + "id": "gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", + "cost": { + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 + }, + "type": "chat" + }, + { + "id": "gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + 
"output": 128000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10 + }, + "type": "chat" + }, + { + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 1536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2022-12", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", + "cost": { + "input": 0.1, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", + "cost": { + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } + }, + "type": "chat" + }, + { + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + 
"reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + }, + "type": "chat" + }, + { + "id": "gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 21, + "output": 168 + }, + "type": "chat" + }, + { + "id": "gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "cost": { + "input": 5, + "output": 15 + }, + "type": 
"chat" + }, + { + "id": "chatgpt-image-latest", + "name": "chatgpt-image-latest", + "display_name": "chatgpt-image-latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", + "type": "chat" + }, + { + "id": "gpt-5.3-codex-spark", + "name": "GPT-5.3 Codex Spark", + "display_name": "GPT-5.3 Codex Spark", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + 
"verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "gpt-image-1.5", + "name": "gpt-image-1.5", + "display_name": "gpt-image-1.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "type": "imageGeneration" + }, + { + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, + "type": "chat" + }, + { + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + 
"display_name": "text-embedding-3-small", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8191, + "output": 1536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.02, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 272000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "cost": { + "input": 15, + "output": 120 + }, + "type": "chat" + }, + { + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "type": "chat" + }, + { + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + 
"context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + }, + "type": "chat" + }, + { + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, + "type": "chat" + }, + { + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + 
"default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } + }, + "type": "chat" + }, + { + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "type": "chat" + }, + { + "id": "o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", + "cost": { + "input": 150, + "output": 600 + }, 
+ "type": "chat" + }, + { + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 10, + "output": 30 + }, + "type": "chat" + }, + { + "id": "gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", + "cost": { + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 + }, + "type": "chat" + }, + { + "id": "o1", + "name": "o1", + "display_name": "o1", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + 
"attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + }, + "type": "chat" + }, + { + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", + "cost": { + "input": 5, + "output": 30, + "cache_read": 0.5, + 
"tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } + }, + "type": "chat" + }, + { + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } + }, + "type": "chat" + }, + { + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", + "modalities": { + "input": [ + "text", 
+ "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, + "type": "chat" + }, + { + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + }, + "type": "chat" + }, + { + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 30, + "output": 60 + }, + "type": "chat" + }, + { + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": 
true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + }, + "type": "chat" + }, + { + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "gpt-5.2-codex", + "name": "GPT-5.2 
Codex", + "display_name": "GPT-5.2 Codex", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "gpt-image-1", + "name": "gpt-image-1", + "display_name": "gpt-image-1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-24", + "last_updated": "2025-04-24", + "type": "imageGeneration" + }, + { + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + 
"open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + }, + "type": "chat" + }, + { + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "type": "chat" + }, + { + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", + 
"modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "o3", + "name": "o3", + "display_name": "o3", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, + "type": "chat" + }, + { + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 65536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "type": "chat" + }, + { 
+ "id": "o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", + "cost": { + "input": 10, + "output": 40, + "cache_read": 2.5 + }, + "type": "chat" + }, + { + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + 
"supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "gpt-image-2", + "name": "gpt-image-2", + "display_name": "gpt-image-2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 5, + "output": 30, + "cache_read": 1.25 + }, + "type": "imageGeneration" + } + ] + }, + "dinference": { + "id": "dinference", + "name": "DInference", + "display_name": "DInference", + "api": "https://api.dinference.com/v1", + "doc": "https://dinference.com", + "models": [ + { + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08", + "last_updated": "2025-08", + "cost": { + "input": 0.0675, + "output": 0.27 + }, + "type": "chat" + }, + { + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + 
"continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 1.25, + "output": 3.89 + }, + "type": "chat" + }, + { + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.22, + "output": 0.88 + }, + "type": "chat" + }, + { + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0.45, + "output": 1.65 + }, + "type": "chat" + }, + { + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0.75, + "output": 2.4 + }, + "type": "chat" + } + ] + }, + "vivgrid": { + "id": "vivgrid", + "name": "Vivgrid", + "display_name": "Vivgrid", + "api": "https://api.vivgrid.com/v1", + "doc": "https://docs.vivgrid.com/models", + "models": [ + { + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", + "cost": { + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 + }, + "type": "chat" + }, + { + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.28, + "output": 0.42 + }, + "type": "chat" + }, + { + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": 
"GPT-5.4", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "type": "chat" + }, + { + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", + "cost": { + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 + }, + "type": "chat" + }, + { + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + 
] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "cache_write": 1 + }, + "type": "chat" + }, + { + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + }, + "type": "chat" + }, + { + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + 
"reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + 
"verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 272000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.03 + }, + "type": "chat" + }, + { + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + 
"last_updated": "2026-02-24", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 384000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 + }, + "type": "chat" + }, + { + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", + "cost": { + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] + }, + "type": "chat" + } + ] + }, + "cerebras": { 
+ "id": "cerebras", + "name": "Cerebras", + "display_name": "Cerebras", + "doc": "https://inference-docs.cerebras.ai/models/overview", + "models": [ + { + "id": "zai-glm-4.7", + "name": "Z.AI GLM-4.7", + "display_name": "Z.AI GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 40000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-10", + "last_updated": "2026-01-10", + "cost": { + "input": 2.25, + "output": 2.75, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "qwen-3-235b-a22b-instruct-2507", + "name": "Qwen 3 235B Instruct", + "display_name": "Qwen 3 235B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", + "cost": { + "input": 0.6, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.25, + "output": 0.69 + }, + "type": "chat" + }, + { + "id": "llama3.1-8b", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + 
"context": 32000, + "output": 8000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "chat" + } + ] + }, + "cloudflare-ai-gateway": { + "id": "cloudflare-ai-gateway", + "name": "Cloudflare AI Gateway", + "display_name": "Cloudflare AI Gateway", + "doc": "https://developers.cloudflare.com/ai-gateway/", + "models": [ + { + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + 
"id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16385, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", + "cost": { + "input": 20, + "output": 80 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": 
false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + 
"open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 10, + "output": 30 + }, + "type": "chat" + }, + { + "id": "openai/o1", + "name": "o1", + "display_name": "o1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 30, + "output": 60 + }, + "type": "chat" + }, + { + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } 
+ }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 
14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -57045,167 +65423,242 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2026-05-01", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0, - "output": 0 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "stepfun/step-3.5-flash", - "name": "StepFun: Step 3.5 Flash", - "display_name": "StepFun: Step 3.5 Flash", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": 
"2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "alpindale/goliath-120b", - "name": "Goliath 120B", - "display_name": "Goliath 120B", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 6144, - "output": 1024 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-10", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 3.75, - "output": 7.5 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral: Mistral Nemo", - "display_name": "Mistral: Mistral Nemo", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-01", - "last_updated": "2024-07-30", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + 
"attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.02, - "output": 0.04 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "mistralai/mistral-saba", - "name": "Mistral: Saba", - "display_name": "Mistral: Saba", + "id": "anthropic/claude-3-sonnet", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-02-17", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0.2, - "output": 0.6 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2512", - "name": "Mistral: Mistral Large 3 2512", - "display_name": "Mistral: Mistral Large 3 2512", + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -57213,95 +65666,113 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2024-11-01", - "last_updated": "2025-12-16", + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - 
"id": "mistralai/devstral-medium", - "name": "Mistral: Devstral Medium", - "display_name": "Mistral: Devstral Medium", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.4, - "output": 2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mistralai/mistral-small-3.1-24b-instruct", - "name": "Mistral: Mistral Small 3.1 24B", - "display_name": "Mistral: Mistral Small 3.1 24B", + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-17", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.35, - "output": 0.56, - "cache_read": 0.015 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3-5", - "name": 
"Mistral: Mistral Medium 3.5", - "display_name": "Mistral: Mistral Medium 3.5", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -57311,249 +65782,408 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-05-07", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.5, - "output": 7.5 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "mistralai/pixtral-large-2411", - "name": "Mistral: Pixtral Large 2411", - "display_name": "Mistral: Pixtral Large 2411", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2024-11-19", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 2, - "output": 6 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "mistralai/devstral-2512", - "name": "Mistral: Devstral 2 2512", - "display_name": "Mistral: Devstral 2 2512", + "id": "anthropic/claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-12", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.025 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Mistral: Codestral 2508", - "display_name": "Mistral: Codestral 2508", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 
256000, - "output": 51200 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.3, - "output": 0.9 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "mistralai/mistral-small-24b-instruct-2501", - "name": "Mistral: Mistral Small 3", - "display_name": "Mistral: Mistral Small 3", + "id": "anthropic/claude-3-opus", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-01-10", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.05, - "output": 0.08 + "input": 15, + "output": 75, + 
"cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2411", - "name": "Mistral Large 2411", - "display_name": "Mistral Large 2411", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2024-11-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 6 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x22b-instruct", - "name": "Mistral: Mixtral 8x22B Instruct", - "display_name": "Mistral: Mixtral 8x22B Instruct", + "id": "anthropic/claude-3-5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 13108 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2, - "output": 6 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2407", - "name": "Mistral Large 2407", - "display_name": "Mistral Large 
2407", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6 (latest)", + "display_name": "Claude Opus 4.6 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-19", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 2, - "output": 6 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "mistralai/ministral-8b-2512", - "name": "Mistral: Ministral 3 8B 2512", - "display_name": "Mistral: Ministral 3 8B 2512", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -57561,88 +66191,148 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3.1", - "name": "Mistral: Mistral Medium 3.1", - "display_name": "Mistral: Mistral Medium 3.1", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + 
"extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.4, - "output": 2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "mistralai/mistral-small-2603", - "name": "Mistral: Mistral Small 4", - "display_name": "Mistral: Mistral Small 4", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-04-11", + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.015 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" - }, + } + ] + }, + "vultr": { + "id": "vultr", + "name": "Vultr", + "display_name": "Vultr", + "api": "https://api.vultrinference.com/v1", + "doc": "https://api.vultrinference.com/", + "models": [ { - 
"id": "mistralai/ministral-3b-2512", - "name": "Mistral: Ministral 3 3B 2512", - "display_name": "Mistral: Ministral 3 3B 2512", + "id": "Kimi-K2.5", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -57650,60 +66340,77 @@ ] }, "limit": { - "context": 131072, + "context": 254000, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.55, + "output": 2.75 }, "type": "chat" }, { - "id": "mistralai/voxtral-small-24b-2507", - "name": "Mistral: Voxtral Small 24B 2507", - "display_name": "Mistral: Voxtral Small 24B 2507", + "id": "DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 6400 + "context": 127000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.55, + "output": 1.65 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x7b-instruct", - "name": "Mistral: Mixtral 8x7B Instruct", - "display_name": "Mistral: Mixtral 8x7B Instruct", + 
"id": "MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -57713,63 +66420,73 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 194000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2023-12-10", - "last_updated": "2026-03-15", + "knowledge": "2024-09", + "release_date": "2025-02-11", + "last_updated": "2025-02-11", "cost": { - "input": 0.54, - "output": 0.54 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3", - "name": "Mistral: Mistral Medium 3", - "display_name": "Mistral: Mistral Medium 3", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 129000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.4, - "output": 2 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "mistralai/mistral-small-3.2-24b-instruct", - "name": "Mistral: Mistral Small 3.2 24B", - "display_name": "Mistral: Mistral Small 3.2 24B", + "id": "GLM-5-FP8", + "name": "GLM 5 FP8", + "display_name": "GLM 5 FP8", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -57777,7 +66494,7 @@ ] }, "limit": { - "context": 131072, + "context": 200000, "output": 131072 }, 
"temperature": true, @@ -57785,21 +66502,30 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "knowledge": "2025-05", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.06, - "output": 0.18, - "cache_read": 0.03 + "input": 0.85, + "output": 3.1 }, "type": "chat" - }, + } + ] + }, + "kuae-cloud-coding-plan": { + "id": "kuae-cloud-coding-plan", + "name": "KUAE Cloud Coding Plan", + "display_name": "KUAE Cloud Coding Plan", + "api": "https://coding-plan-endpoint.kuaecloud.net/v1", + "doc": "https://docs.mthreads.com/kuaecloud/kuaecloud-doc-online/coding_plan/", + "models": [ { - "id": "mistralai/devstral-small", - "name": "Mistral: Devstral Small 1.1", - "display_name": "Mistral: Devstral Small 1.1", + "id": "GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -57809,28 +66535,52 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-05-07", - "last_updated": "2025-07-10", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "modelscope": { + "id": "modelscope", + "name": "ModelScope", + "display_name": "ModelScope", + "api": "https://api-inference.modelscope.cn/v1", + "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", + "models": [ { - "id": 
"mistralai/mistral-large", - "name": "Mistral Large", - "display_name": "Mistral Large", + "id": "ZhipuAI/GLM-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -57840,28 +66590,30 @@ ] }, "limit": { - "context": 128000, - "output": 25600 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2025-12-02", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2, - "output": 6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct-v0.1", - "name": "Mistral: Mistral 7B Instruct v0.1", - "display_name": "Mistral: Mistral 7B Instruct v0.1", + "id": "ZhipuAI/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -57871,60 +66623,35 @@ ] }, "limit": { - "context": 2824, - "output": 565 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", - "cost": { - "input": 0.11, - "output": 0.19 - }, - "type": "chat" - }, - { - "id": "mistralai/ministral-14b-2512", - "name": "Mistral: Ministral 3 14B 2512", - "display_name": "Mistral: Ministral 3 14B 2512", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 52429 + "context": 202752, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + 
"open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Meta: Llama 3.3 70B Instruct", - "display_name": "Meta: Llama 3.3 70B Instruct", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -57934,39 +66661,51 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.1, - "output": 0.32 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout", - "name": "Meta: Llama 4 Scout", - "display_name": "Meta: Llama 4 Scout", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 327680, + "context": 262144, "output": 16384 }, "temperature": true, @@ -57974,20 +66713,21 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0, + 
"output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-guard-3-8b", - "name": "Llama Guard 3 8B", - "display_name": "Llama Guard 3 8B", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -57997,95 +66737,116 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-04-18", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.02, - "output": 0.06 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick", - "name": "Meta: Llama 4 Maverick", - "display_name": "Meta: Llama 4 Maverick", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 16384 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-12-24", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-11b-vision-instruct", - "name": "Meta: Llama 3.2 11B Vision Instruct", - "display_name": "Meta: Llama 3.2 11B Vision Instruct", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ - "text", - "image" + 
"text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.049, - "output": 0.049 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "kimi-for-coding": { + "id": "kimi-for-coding", + "name": "Kimi For Coding", + "display_name": "Kimi For Coding", + "api": "https://api.kimi.com/coding/v1", + "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", + "models": [ { - "id": "meta-llama/llama-guard-4-12b", - "name": "Meta: Llama Guard 4 12B", - "display_name": "Meta: Llama Guard 4 12B", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -58093,90 +66854,126 @@ ] }, "limit": { - "context": 163840, + "context": 262144, "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", "cost": { - "input": 0.18, - "output": 
0.18 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-70b-instruct", - "name": "Meta: Llama 3.1 70B Instruct", - "display_name": "Meta: Llama 3.1 70B Instruct", + "id": "k2p6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-23", + "knowledge": "2025-01", + "release_date": "2026-04", + "last_updated": "2026-04", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-1b-instruct", - "name": "Meta: Llama 3.2 1B Instruct", - "display_name": "Meta: Llama 3.2 1B Instruct", + "id": "k2p5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 60000, - "output": 12000 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2026-01-27", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.027, - "output": 0.2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "lucidquery": { + "id": "lucidquery", + "name": "LucidQuery AI", + "display_name": "LucidQuery AI", + "api": "https://lucidquery.com/api/v1", + "doc": "https://lucidquery.com/api/docs", + "models": [ 
{ - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Meta: Llama 3.2 3B Instruct", - "display_name": "Meta: Llama 3.2 3B Instruct", + "id": "lucidquery-nexus-coder", + "name": "LucidQuery Nexus Coder", + "display_name": "LucidQuery Nexus Coder", "modalities": { "input": [ "text" @@ -58186,28 +66983,30 @@ ] }, "limit": { - "context": 80000, - "output": 16384 + "context": 250000, + "output": 60000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.051, - "output": 0.34 + "input": 2, + "output": 5 }, "type": "chat" }, { - "id": "meta-llama/llama-3-8b-instruct", - "name": "Meta: Llama 3 8B Instruct", - "display_name": "Meta: Llama 3 8B Instruct", + "id": "lucidnova-rf1-100b", + "name": "LucidNova RF1 100B", + "display_name": "LucidNova RF1 100B", "modalities": { "input": [ "text" @@ -58217,28 +67016,39 @@ ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 120000, + "output": 8000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2025-04-03", + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-16", + "release_date": "2024-12-28", + "last_updated": "2025-09-10", "cost": { - "input": 0.03, - "output": 0.04 + "input": 2, + "output": 5 }, "type": "chat" - }, + } + ] + }, + "neuralwatt": { + "id": "neuralwatt", + "name": "Neuralwatt", + "display_name": "Neuralwatt", + "api": "https://api.neuralwatt.com/v1", + "doc": "https://portal.neuralwatt.com/docs", + 
"models": [ { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Meta: Llama 3.1 8B Instruct", - "display_name": "Meta: Llama 3.1 8B Instruct", + "id": "qwen3.5-397b-fast", + "name": "Qwen3.5 397B Fast", + "display_name": "Qwen3.5 397B Fast", "modalities": { "input": [ "text" @@ -58248,28 +67058,39 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2025-12-23", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.02, - "output": 0.05 + "input": 0.69, + "output": 4.14 }, "type": "chat" }, { - "id": "meta-llama/llama-3-70b-instruct", - "name": "Meta: Llama 3 70B Instruct", - "display_name": "Meta: Llama 3 70B Instruct", + "id": "glm-5-fast", + "name": "GLM 5 Fast", + "display_name": "GLM 5 Fast", "modalities": { "input": [ "text" @@ -58279,32 +67100,30 @@ ] }, "limit": { - "context": 8192, - "output": 8000 + "context": 202736, + "output": 202736 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.51, - "output": 0.74 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "x-ai/grok-4.20", - "name": "xAI: Grok 4.20", - "display_name": "xAI: Grok 4.20", + "id": "glm-5.1-fast", + "name": "GLM 5.1 Fast", + "display_name": "GLM 5.1 Fast", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -58312,102 +67131,103 @@ ] }, "limit": { - "context": 
2000000, - "output": 2000000 + "context": 202736, + "output": 202736 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-31", - "last_updated": "2026-04-11", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1:optimized:free", - "name": "xAI: Grok Code Fast 1 Optimized (experimental, free)", - "display_name": "xAI: Grok Code Fast 1 Optimized (experimental, free)", + "id": "kimi-k2.6-fast", + "name": "Kimi K2.6 Fast", + "display_name": "Kimi K2.6 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-27", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0 + "input": 0.69, + "output": 3.22 }, "type": "chat" }, { - "id": "x-ai/grok-4.3", - "name": "xAI: Grok 4.3", - "display_name": "xAI: Grok 4.3", + "id": "qwen3.6-35b-fast", + "name": "Qwen3.6 35B Fast", + "display_name": "Qwen3.6 35B Fast", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 4096 + "context": 131056, + "output": 131056 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": 
true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.05, + "output": 0.1 }, "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "xAI: Grok 4 Fast", - "display_name": "xAI: Grok 4 Fast", + "id": "kimi-k2.5-fast", + "name": "Kimi K2.5 Fast", + "display_name": "Kimi K2.5 Fast", "modalities": { "input": [ "text", @@ -58418,41 +67238,40 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.52, + "output": 2.59 }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, @@ -58462,59 +67281,75 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "attachment": true, + "open_weights": 
true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.69, + "output": 3.22 }, "type": "chat" }, { - "id": "x-ai/grok-3-beta", - "name": "xAI: Grok 3 Beta", - "display_name": "xAI: Grok 3 Beta", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.52, + "output": 2.59 }, "type": "chat" }, { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -58522,8 +67357,8 @@ ] }, "limit": { - "context": 256000, - "output": 51200 + "context": 16368, + "output": 16368 }, "temperature": true, "tool_call": true, @@ -58536,21 +67371,20 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.03, + "output": 0.16 }, "type": "chat" }, { - "id": 
"x-ai/grok-3-mini", - "name": "xAI: Grok 3 Mini", - "display_name": "xAI: Grok 3 Mini", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM 5.1 FP8", + "display_name": "GLM 5.1 FP8", "modalities": { "input": [ "text" @@ -58560,8 +67394,8 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 202736, + "output": 202736 }, "temperature": true, "tool_call": true, @@ -58569,21 +67403,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "xAI: Grok 4.1 Fast", - "display_name": "xAI: Grok 4.1 Fast", + "id": "mistralai/Devstral-Small-2-24B-Instruct-2512", + "name": "Devstral Small 2 24B Instruct 2512", + "display_name": "Devstral Small 2 24B Instruct 2512", "modalities": { "input": [ "text", @@ -58594,30 +67438,28 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "open_weights": true, + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.12, + "output": 0.35 }, "type": "chat" }, { - "id": "x-ai/grok-3-mini-beta", - "name": "xAI: Grok 3 Mini Beta", - "display_name": "xAI: Grok 3 Mini Beta", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax 
M2.5", "modalities": { "input": [ "text" @@ -58627,8 +67469,8 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 196592, + "output": 196592 }, "temperature": true, "tool_call": true, @@ -58636,25 +67478,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 0.35, + "output": 1.38 }, "type": "chat" }, { - "id": "x-ai/grok-4.20-multi-agent", - "name": "xAI: Grok 4.20 Multi-Agent", - "display_name": "xAI: Grok 4.20 Multi-Agent", + "id": "Qwen/Qwen3.5-397B-A17B-FP8", + "name": "Qwen3.5 397B A17B FP8", + "display_name": "Qwen3.5 397B A17B FP8", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -58662,73 +67512,105 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 262128, + "output": 262128 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-31", - "last_updated": "2026-04-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 0.69, + "output": 4.14 }, "type": "chat" }, { - "id": "x-ai/grok-3", - "name": "xAI: Grok 3", - "display_name": "xAI: Grok 3", + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", 
+ "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 131056, + "output": 131056 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.05, + "output": 0.1 }, "type": "chat" - }, + } + ] + }, + "azure-cognitive-services": { + "id": "azure-cognitive-services", + "name": "Azure Cognitive Services", + "display_name": "Azure Cognitive Services", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "tencent/hy3-preview:free", - "name": "Tencent: Hy3 Preview (free)", - "display_name": "Tencent: Hy3 Preview (free)", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -58736,238 +67618,371 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-05-01", + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 
5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "tencent/hunyuan-a13b-instruct", - "name": "Tencent: Hunyuan A13B Instruct", - "display_name": "Tencent: Hunyuan A13B Instruct", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.14, - "output": 0.57 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gryphe/mythomax-l2-13b", - "name": "MythoMax 13B", - "display_name": "MythoMax 13B", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.06, - "output": 0.06 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, 
"type": "chat" }, { - "id": "sao10k/l3-euryale-70b", - "name": "Sao10k: Llama 3 Euryale 70B v2.1", - "display_name": "Sao10k: Llama 3 Euryale 70B v2.1", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-18", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.48, - "output": 1.48 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "sao10k/l3-lunaris-8b", - "name": "Sao10K: Llama 3 8B Lunaris", - "display_name": "Sao10K: Llama 3 8B Lunaris", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-08-13", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.04, - "output": 0.05 + "input": 0.95, + "output": 4 }, "type": "chat" }, { - "id": "sao10k/l3.3-euryale-70b", - "name": "Sao10K: Llama 3.3 Euryale 70B", - "display_name": "Sao10K: Llama 3.3 Euryale 70B", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, 
- "attachment": false, - "open_weights": true, - "release_date": "2024-12-18", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.65, - "output": 0.75 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "sao10k/l3.1-70b-hanami-x1", - "name": "Sao10K: Llama 3.1 70B Hanami x1", - "display_name": "Sao10K: Llama 3.1 70B Hanami x1", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 272000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-08", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 3, - "output": 3 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "sao10k/l3.1-euryale-70b", - "name": "Sao10K: Llama 3.1 Euryale 70B v2.2", - "display_name": "Sao10K: Llama 3.1 Euryale 70B v2.2", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ - "text" + "text", + 
"image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-28", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.85, - "output": 0.85 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "WizardLM-2 8x22B", - "display_name": "WizardLM-2 8x22B", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -58977,31 +67992,34 @@ ] }, "limit": { - "context": 65535, - "output": 8000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-04-24", - "last_updated": "2024-04-24", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.62, - "output": 0.62 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Microsoft: Phi 4 Mini Instruct", - "display_name": "Microsoft: Phi 4 Mini Instruct", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -59009,28 +68027,27 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - 
"attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-10-17", - "last_updated": "2026-05-07", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.08, - "output": 0.35, - "cache_read": 0.08 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "microsoft/phi-4", - "name": "Microsoft: Phi 4", - "display_name": "Microsoft: Phi 4", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text" @@ -59040,28 +68057,45 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.06, - "output": 0.14 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "poolside/laguna-m.1:free", - "name": "Poolside: Laguna M.1 (free)", - "display_name": "Poolside: Laguna M.1 (free)", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -59071,123 +68105,176 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + 
"open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0 + "input": 0.71, + "output": 0.71 }, "type": "chat" }, { - "id": "poolside/laguna-xs.2:free", - "name": "Poolside: Laguna XS.2 (free)", - "display_name": "Poolside: Laguna XS.2 (free)", + "id": "gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "cohere/command-r7b-12-2024", - "name": "Cohere: Command R7B (12-2024)", - "display_name": "Cohere: Command R7B (12-2024)", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-27", - 
"last_updated": "2024-02-27", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "cohere/command-a", - "name": "Cohere: Command A", - "display_name": "Cohere: Command A", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 272000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2.5, - "output": 10 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Cohere: Command R+ (08-2024)", - "display_name": "Cohere: Command R+ (08-2024)", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -59198,7 +68285,7 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -59207,21 +68294,23 @@ }, "attachment": false, "open_weights": true, - "release_date": 
"2024-08-30", - "last_updated": "2024-08-30", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2.5, - "output": 10 + "input": 0.3, + "output": 0.61 }, "type": "chat" }, { - "id": "cohere/command-r-08-2024", - "name": "Cohere: Command R (08-2024)", - "display_name": "Cohere: Command R (08-2024)", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -59229,27 +68318,30 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "prime-intellect/intellect-3", - "name": "Prime Intellect: INTELLECT-3", - "display_name": "Prime Intellect: INTELLECT-3", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ "text" @@ -59259,129 +68351,176 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-11-26", - "last_updated": "2026-02-04", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.2, - "output": 1.1 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", - "name": 
"NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", - "display_name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-03-16", - "last_updated": "2025-03-16", + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "NVIDIA: Nemotron 3 Super", - "display_name": "NVIDIA: Nemotron 3 Super", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + 
"visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-04-11", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.1, - "output": 0.5, - "cache_read": 0.1 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", - "name": "NVIDIA: Nemotron 3 Nano Omni (free)", - "display_name": "NVIDIA: Nemotron 3 Nano Omni (free)", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", - "audio", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0, - "output": 0 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "NVIDIA: Nemotron 3 Nano 30B A3B", - "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ "text" @@ -59391,61 +68530,62 @@ ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-12", - "last_updated": "2026-02-04", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": 
"2024-04-23", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b:free", - "name": "NVIDIA: Nemotron 3 Super (free)", - "display_name": "NVIDIA: Nemotron 3 Super (free)", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-12", - "last_updated": "2026-03-15", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0, - "output": 0 + "input": 0.37, + "output": 0.37 }, "type": "chat" }, { - "id": "nvidia/nemotron-nano-9b-v2", - "name": "NVIDIA: Nemotron Nano 9B V2", - "display_name": "NVIDIA: Nemotron Nano 9B V2", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -59455,29 +68595,29 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { "input": 0.04, - "output": 0.16 + "output": 0.04 }, "type": "chat" }, { - "id": "nvidia/llama-3.1-nemotron-70b-instruct", - "name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", - "display_name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", + "id": "meta-llama-3-8b-instruct", + "name": 
"Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" @@ -59487,28 +68627,29 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-10-12", - "last_updated": "2024-10-12", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 1.2, - "output": 1.2 + "input": 0.3, + "output": 0.61 }, "type": "chat" }, { - "id": "inception/mercury-2", - "name": "Inception: Mercury 2", - "display_name": "Inception: Mercury 2", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ "text" @@ -59518,30 +68659,29 @@ ] }, "limit": { - "context": 128000, - "output": 50000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "OpenAI: GPT-5.1-Codex-Max", - "display_name": "OpenAI: GPT-5.1-Codex-Max", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", @@ -59552,55 +68692,31 @@ ] }, "limit": { - "context": 400000, + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": 
false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "OpenAI: GPT-5.2 Chat", - "display_name": "OpenAI: GPT-5.2 Chat", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -59608,29 +68724,30 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "OpenAI: GPT-4o-mini Search Preview", - "display_name": "OpenAI: GPT-4o-mini Search Preview", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -59640,32 +68757,32 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": 
true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01", - "last_updated": "2025-01", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "OpenAI: GPT-5 Chat", - "display_name": "OpenAI: GPT-5 Chat", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -59673,66 +68790,31 @@ ] }, "limit": { - "context": 128000, + "context": 16384, "output": 16384 }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4o-2024-05-13", - "name": "OpenAI: GPT-4o (2024-05-13)", - "display_name": "OpenAI: GPT-4o (2024-05-13)", - "modalities": { - "input": [ - "image", - "pdf", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2026-03-15", + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 5, - "output": 15 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "openai/gpt-5.3-chat", - "name": "OpenAI: GPT-5.3 Chat", - "display_name": "OpenAI: GPT-5.3 Chat", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ 
-59740,40 +68822,40 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 512, + "output": 1024 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-04", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 1.75, - "output": 14 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "OpenAI: GPT-5.2 Pro", - "display_name": "OpenAI: GPT-5.2 Pro", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -59786,14 +68868,8 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -59801,55 +68877,24 @@ "visibility": "hidden" } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", - "cost": { - "input": 21, - "output": 168 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4-1106-preview", - "name": "OpenAI: GPT-4 Turbo (older v1106)", - "display_name": "OpenAI: GPT-4 Turbo (older v1106)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": false, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { 
- "input": 10, - "output": 30 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "openai/gpt-chat-latest", - "name": "OpenAI: GPT Chat Latest", - "display_name": "OpenAI: GPT Chat Latest", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -59857,8 +68902,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -59866,74 +68911,68 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-05-05", - "last_updated": "2026-05-07", + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 1.5, + "output": 6, + "cache_read": 0.375 }, "type": "chat" }, { - "id": "openai/gpt-4o-audio-preview", - "name": "OpenAI: GPT-4o Audio", - "display_name": "OpenAI: GPT-4o Audio", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "audio", - "text" + "text", + "image" ], "output": [ - "audio", "text" ] }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 2.5, - "output": 10 + "input": 2.04, + "output": 2.04 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "OpenAI: GPT-5.5", - "display_name": "OpenAI: GPT-5.5", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + 
"display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -59942,43 +68981,32 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "OpenAI: GPT-5 Mini", - "display_name": "OpenAI: GPT-5 Mini", + "id": "mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -59986,63 +69014,41 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - 
"attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "OpenAI: GPT-5 Nano", - "display_name": "OpenAI: GPT-5 Nano", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 272000, "output": 128000 }, "temperature": false, @@ -60074,48 +69080,53 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-05-30", "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "last_updated": "2025-08-07", "cost": { "input": 0.05, "output": 0.4, - "cache_read": 0.005 + "cache_read": 0.01 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "OpenAI: GPT-5.3-Codex", - "display_name": "OpenAI: GPT-5.3-Codex", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ + "text", "image", - "text" + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 400000, + "context": 272000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -60128,18 +69139,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-25", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": 
"2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 1.75, - "output": 14 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-16k", - "name": "OpenAI: GPT-3.5 Turbo 16k", - "display_name": "OpenAI: GPT-3.5 Turbo 16k", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ "text" @@ -60149,28 +69162,61 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2023-08-28", - "last_updated": "2026-03-15", + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 3, - "output": 4 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "OpenAI: GPT-4 Turbo", - "display_name": "OpenAI: GPT-4 Turbo", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "cost": { + "input": 2.68, + "output": 3.54 + }, + "type": "chat" + }, + { + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ "text", @@ -60182,7 +69228,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -60191,79 +69237,54 @@ }, "attachment": true, "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2024-04-09", + 
"knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 10, - "output": 30 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "OpenAI: GPT-5.2", - "display_name": "OpenAI: GPT-5.2", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.2, + "output": 0.78 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "OpenAI: o3 Pro", - "display_name": "OpenAI: o3 Pro", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60271,46 +69292,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8191, + "output": 1536 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 20, - "output": 80 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "openai/o3-mini-high", - "name": "OpenAI: o3 Mini High", - "display_name": "OpenAI: o3 Mini High", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ - "pdf", "text" ], "output": [ @@ -60318,48 +69322,31 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "OpenAI: GPT-4o-mini", - "display_name": "OpenAI: GPT-4o-mini", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60368,32 +69355,30 @@ }, "limit": { 
"context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.16, + "output": 0.64 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "OpenAI: o4 Mini Deep Research", - "display_name": "OpenAI: o4 Mini Deep Research", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60401,105 +69386,62 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-06-26", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "OpenAI: GPT-5.4 Mini", - "display_name": "OpenAI: GPT-5.4 Mini", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, 
"limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-04-11", + "release_date": "2025-05-19", + "last_updated": "2025-11-18", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.14, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "OpenAI: GPT-5.1 Chat", - "display_name": "OpenAI: GPT-5.1 Chat", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60508,41 +69450,43 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI: o4 Mini", - "display_name": "OpenAI: o4 Mini", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "audio" ], "output": [ - 
"text" + "text", + "image", + "audio" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": true, @@ -60550,39 +69494,24 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "OpenAI: GPT-5.4 Nano", - "display_name": "OpenAI: GPT-5.4 Nano", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60590,52 +69519,30 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-04-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 
0.02 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "OpenAI: GPT-5.2-Codex", - "display_name": "OpenAI: GPT-5.2-Codex", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", @@ -60662,10 +69569,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -60676,25 +69583,24 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-2024-07-18", - "name": "OpenAI: GPT-4o-mini (2024-07-18)", - "display_name": "OpenAI: GPT-4o-mini (2024-07-18)", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60702,31 +69608,31 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2026-03-15", + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "OpenAI: GPT-5.1-Codex-Mini", - "display_name": "OpenAI: GPT-5.1-Codex-Mini", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": 
"Phi-3-mini-instruct (128k)", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -60734,55 +69640,31 @@ ] }, "limit": { - "context": 400000, - "output": 100000 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "OpenAI: GPT-4o (2024-08-06)", - "display_name": "OpenAI: GPT-4o (2024-08-06)", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60791,67 +69673,62 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-06", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-5-image", - "name": "OpenAI: GPT-5 Image", - "display_name": "OpenAI: GPT-5 Image", + 
"id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-14", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 10, - "output": 10 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "OpenAI: GPT-5.1", - "display_name": "OpenAI: GPT-5.1", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60859,55 +69736,69 @@ ] }, "limit": { - "context": 400000, + "context": 4096, + "output": 1024 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.17, + "output": 0.68 + }, + "type": "chat" + }, + { + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": 
"medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60915,48 +69806,31 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-05", - "last_updated": "2026-03-15", + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "OpenAI: GPT-5.4 Pro", - "display_name": "OpenAI: GPT-5.4 Pro", + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60964,48 +69838,93 @@ ] }, "limit": { - "context": 1050000, + "context": 128000, + "output": 4096 + }, + "temperature": true, + 
"tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.17, + "output": 0.68 + }, + "type": "chat" + }, + { + "id": "deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "display_name": "DeepSeek-V3.2-Speciale", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, "output": 128000 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.58, + "output": 1.68 }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-15", + "type": "chat" + }, + { + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 1024 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 30, - "output": 180 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "OpenAI: GPT-3.5 Turbo", - "display_name": "OpenAI: GPT-3.5 Turbo", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": 
"DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -61015,8 +69934,8 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -61024,23 +69943,22 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.5, - "output": 1.5 + "input": 1.14, + "output": 4.56 }, "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "OpenAI: o3 Deep Research", - "display_name": "OpenAI: o3 Deep Research", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -61048,8 +69966,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -61060,58 +69978,62 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2024-06-26", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI: o3 Mini", - "display_name": "OpenAI: o3 Mini", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ - "pdf", - "text" + 
"text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -61119,21 +70041,22 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-20", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo-preview", - "name": "OpenAI: GPT-4 Turbo Preview", - "display_name": "OpenAI: GPT-4 Turbo Preview", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -61143,32 +70066,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2026-03-15", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 10, - "output": 30 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "openai/o1-pro", - "name": "OpenAI: o1-pro", - "display_name": "OpenAI: o1-pro", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ - "image", - "pdf", "text" ], 
"output": [ @@ -61176,11 +70096,11 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 32768 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -61199,78 +70119,99 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-19", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 150, - "output": 600 + "input": 16.5, + "output": 66, + "cache_read": 8.25 }, "type": "chat" }, { - "id": "openai/gpt-5.4-image-2", - "name": "OpenAI: GPT-5.4 Image 2", - "display_name": "OpenAI: GPT-5.4 Image 2", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "image", "text", - "pdf" + "image" ], "output": [ - "image", "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.25, + "output": 1 + }, + "type": "chat" + }, + { + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 163840 + }, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": 
"medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 8, - "output": 15, - "cache_read": 2 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "OpenAI: GPT-4", - "display_name": "OpenAI: GPT-4", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -61280,8 +70221,8 @@ ] }, "limit": { - "context": 8191, - "output": 4096 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -61289,19 +70230,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2023-03-14", - "last_updated": "2024-04-09", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 30, - "output": 60 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "openai/gpt-4-0314", - "name": "OpenAI: GPT-4 (older v0314)", - "display_name": "OpenAI: GPT-4 (older v0314)", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ "text" @@ -61311,28 +70253,29 @@ ] }, "limit": { - "context": 8191, - "output": 4096 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2023-05-28", - "last_updated": "2026-03-15", + "knowledge": "2021-08", + "release_date": "2024-01-25", + 
"last_updated": "2024-01-25", "cost": { - "input": 30, - "output": 60 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -61350,19 +70293,20 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -61375,110 +70319,90 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1.25, - "output": 10, + "input": 1.75, + "output": 14, "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "OpenAI: GPT-5.4", - "display_name": "OpenAI: GPT-5.4", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - 
"release_date": "2026-03-06", - "last_updated": "2026-03-15", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 2.5, - "output": 15 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "openai/gpt-audio", - "name": "OpenAI: GPT Audio", - "display_name": "OpenAI: GPT Audio", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ - "audio", "text" ], "output": [ - "audio", "text" ] }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-20", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2.5, - "output": 10 + "input": 5.33, + "output": 16 }, "type": "chat" }, { - "id": "openai/gpt-4o-search-preview", - "name": "OpenAI: GPT-4o Search Preview", - "display_name": "OpenAI: GPT-4o Search Preview", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -61486,30 +70410,31 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-03-13", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 2.5, - "output": 10 + "input": 0.08, + "output": 0.32, + "input_audio": 4 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "OpenAI: GPT-4.1 Nano", - "display_name": 
"OpenAI: GPT-4.1 Nano", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -61517,33 +70442,31 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "openai/o4-mini-high", - "name": "OpenAI: o4 Mini High", - "display_name": "OpenAI: o4 Mini High", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -61551,46 +70474,32 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32000, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/o3", - "name": "OpenAI: o3", - "display_name": "OpenAI: o3", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + 
"display_name": "Mistral Large 24.11", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -61598,44 +70507,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { "input": 2, - "output": 8, - "cache_read": 0.5 + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: gpt-oss-20b", - "display_name": "OpenAI: gpt-oss-20b", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -61645,8 +70539,39 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 8191, + "output": 3072 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.13, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -61656,28 +70581,35 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + 
"continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 0.03, - "output": 0.14 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - "display_name": "OpenAI: GPT-5 Pro", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" @@ -61691,14 +70623,21 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -61710,124 +70649,101 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2026-03-15", - "cost": { - "input": 15, - "output": 120 - }, - "type": "chat" - }, - { - "id": "openai/gpt-audio-mini", - "name": "OpenAI: GPT Audio Mini", - "display_name": "OpenAI: GPT Audio Mini", - "modalities": { - "input": [ - "audio", - "text" - ], - "output": [ - "audio", - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-01-20", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.6, - "output": 2.4 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "OpenAI: 
GPT-4o", - "display_name": "OpenAI: GPT-4o", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" - }, - { - "id": "openai/gpt-3.5-turbo-0613", - "name": "OpenAI: GPT-3.5 Turbo (older v0613)", - "display_name": "OpenAI: GPT-3.5 Turbo (older v0613)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } ] }, - "limit": { - "context": 4095, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2023-06-13", - "last_updated": "2023-06-13", - "cost": { - "input": 1, - "output": 2 - }, "type": "chat" }, { - "id": "openai/gpt-5-image-mini", - "name": "OpenAI: GPT-5 Image Mini", - "display_name": "OpenAI: GPT-5 Image Mini", + "id": "gpt-5.4-mini", + 
"name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ - "image", "text" ] }, @@ -61835,38 +70751,61 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-16", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 2.5, - "output": 2 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "OpenAI: GPT-5", - "display_name": "OpenAI: GPT-5", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -61880,12 +70819,11 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ - "minimal", - "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -61898,52 +70836,82 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 30, + "output": 180, + "context_over_200k": { + 
"input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "OpenAI: gpt-oss-safeguard-20b", - "display_name": "OpenAI: gpt-oss-safeguard-20b", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.037 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI: gpt-oss-120b", - "display_name": "OpenAI: gpt-oss-120b", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -61953,10 +70921,10 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -61964,36 +70932,46 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": 
"2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.039, - "output": 0.19 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "OpenAI: GPT-5.5 Pro", - "display_name": "OpenAI: GPT-5.5 Pro", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -62001,89 +70979,145 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 30, - "output": 180 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "OpenAI: GPT-3.5 Turbo Instruct", - "display_name": "OpenAI: GPT-3.5 Turbo Instruct", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4095, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-03-01", - "last_updated": "2023-09-21", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": 
"2025-04-14", "cost": { - "input": 1.5, - "output": 2 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "OpenAI: GPT-4.1", - "display_name": "OpenAI: GPT-4.1", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "OpenAI: GPT-4.1 Mini", - "display_name": "OpenAI: GPT-4.1 Mini", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -62091,29 +71125,29 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": 
false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "OpenAI: GPT-5.1-Codex", - "display_name": "OpenAI: GPT-5.1-Codex", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", @@ -62124,56 +71158,33 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "OpenAI: GPT-4o (2024-11-20)", - "display_name": "OpenAI: GPT-4o (2024-11-20)", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -62190,31 +71201,32 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-11-20", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - 
"input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "amazon/nova-lite-v1", - "name": "Amazon: Nova Lite 1.0", - "display_name": "Amazon: Nova Lite 1.0", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -62223,18 +71235,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.06, - "output": 0.24 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "amazon/nova-pro-v1", - "name": "Amazon: Nova Pro 1.0", - "display_name": "Amazon: Nova Pro 1.0", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", @@ -62245,40 +71259,57 @@ ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.8, - "output": 3.2 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "amazon/nova-premier-v1", - "name": "Amazon: Nova Premier 1.0", - 
"display_name": "Amazon: Nova Premier 1.0", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -62287,56 +71318,56 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2.5, - "output": 12.5 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "amazon/nova-2-lite-v1", - "name": "Amazon: Nova 2 Lite", - "display_name": "Amazon: Nova 2 Lite", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65535 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.3, - "output": 2.5 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "amazon/nova-micro-v1", - "name": "Amazon: Nova Micro 1.0", - "display_name": "Amazon: Nova Micro 1.0", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -62344,149 +71375,133 @@ }, "limit": { "context": 128000, - "output": 5120 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": 
false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.035, - "output": 0.14 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" - }, + } + ] + }, + "ovhcloud": { + "id": "ovhcloud", + "name": "OVHcloud AI Endpoints", + "display_name": "OVHcloud AI Endpoints", + "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", + "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", + "models": [ { - "id": "z-ai/glm-5v-turbo", - "name": "Z.ai: GLM 5V Turbo", - "display_name": "Z.ai: GLM 5V Turbo", + "id": "mistral-7b-instruct-v0.3", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-11", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.11, + "output": 0.11 }, "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "Z.ai: GLM 4.7", - "display_name": "Z.ai: GLM 4.7", + "id": "qwen2.5-vl-72b-instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2026-03-15", + "release_date": "2025-03-31", + "last_updated": "2025-03-31", "cost": { - "input": 0.38, - "output": 1.98, - "cache_read": 0.2 + "input": 1.01, + "output": 1.01 }, "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "Z.ai: GLM 5", - "display_name": "Z.ai: GLM 5", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral-Small-3.2-24B-Instruct-2506", + "display_name": "Mistral-Small-3.2-24B-Instruct-2506", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, + "context": 131072, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-15", + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 0.72, - "output": 2.3 + "input": 0.1, + "output": 0.31 }, "type": "chat" }, { - "id": "z-ai/glm-4-32b", - "name": "Z.ai: GLM 4 32B ", - "display_name": "Z.ai: GLM 4 32B ", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral-Nemo-Instruct-2407", + "display_name": "Mistral-Nemo-Instruct-2407", "modalities": { "input": [ "text" @@ -62496,8 +71511,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -62506,55 +71521,61 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-25", - 
"last_updated": "2026-03-15", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "z-ai/glm-5.1", - "name": "Z.ai: GLM 5.1", - "display_name": "Z.ai: GLM 5.1", + "id": "qwen3.5-9b", + "name": "Qwen3.5-9B", + "display_name": "Qwen3.5-9B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 1.26, - "output": 3.96 + "input": 0.1, + "output": 0.15 }, "type": "chat" }, { - "id": "z-ai/glm-4.5", - "name": "Z.ai: GLM 4.5", - "display_name": "Z.ai: GLM 4.5", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -62565,29 +71586,32 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2026-03-15", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.175 + "input": 0.05, + "output": 0.18 }, "type": "chat" }, { - "id": "z-ai/glm-4.5-air", - "name": "Z.ai: GLM 4.5 Air", - "display_name": "Z.ai: GLM 4.5 
Air", + "id": "meta-llama-3_3-70b-instruct", + "name": "Meta-Llama-3_3-70B-Instruct", + "display_name": "Meta-Llama-3_3-70B-Instruct", "modalities": { "input": [ "text" @@ -62598,29 +71622,27 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 0.13, - "output": 0.85, - "cache_read": 0.025 + "input": 0.74, + "output": 0.74 }, "type": "chat" }, { - "id": "z-ai/glm-5-turbo", - "name": "Z.ai: GLM 5 Turbo", - "display_name": "Z.ai: GLM 5 Turbo", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -62630,8 +71652,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -62641,58 +71663,60 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-15", - "last_updated": "2026-04-11", + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.09, + "output": 0.25 }, "type": "chat" }, { - "id": "z-ai/glm-4.5v", - "name": "Z.ai: GLM 4.5V", - "display_name": "Z.ai: GLM 4.5V", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": 
true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 0.6, - "output": 1.8, - "cache_read": 0.11 + "input": 0.07, + "output": 0.26 }, "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "Z.ai: GLM 4.6", - "display_name": "Z.ai: GLM 4.6", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -62702,10 +71726,9 @@ ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -62718,24 +71741,21 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2026-03-15", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.39, - "output": 1.9, - "cache_read": 0.175 + "input": 0.09, + "output": 0.47 }, "type": "chat" }, { - "id": "z-ai/glm-4.6v", - "name": "Z.ai: GLM 4.6V", - "display_name": "Z.ai: GLM 4.6V", + "id": "llama-3.1-8b-instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" @@ -62748,23 +71768,31 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2026-01-10", + "release_date": "2025-06-11", + "last_updated": "2025-06-11", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.11, + "output": 0.11 }, "type": "chat" - }, + } + ] + }, + "friendli": { + "id": "friendli", + "name": "Friendli", + "display_name": "Friendli", + "api": 
"https://api.friendli.ai/serverless/v1", + "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", + "models": [ { - "id": "z-ai/glm-4.7-flash", - "name": "Z.ai: GLM 4.7 Flash", - "display_name": "Z.ai: GLM 4.7 Flash", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -62775,7 +71803,7 @@ }, "limit": { "context": 202752, - "output": 40551 + "output": 202752 }, "temperature": true, "tool_call": true, @@ -62785,27 +71813,32 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.06, - "output": 0.4, - "cache_read": 0.01 + "input": 1, + "output": 3.2, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "Baidu: ERNIE 4.5 VL 424B A47B ", - "display_name": "Baidu: ERNIE 4.5 VL 424B A47B ", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -62813,32 +71846,43 @@ ] }, "limit": { - "context": 123000, - "output": 16000 + "context": 202752, + "output": 202752 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2026-01", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.42, - "output": 1.25 + "input": 1.4, + "output": 4.4, + 
"cache_read": 0.26 }, "type": "chat" }, { - "id": "baidu/qianfan-ocr-fast:free", - "name": "Baidu: Qianfan-OCR-Fast (free)", - "display_name": "Baidu: Qianfan-OCR-Fast (free)", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -62846,29 +71890,28 @@ ] }, "limit": { - "context": 65536, - "output": 28672 + "context": 131072, + "output": 8000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "baidu/cobuddy:free", - "name": "Baidu: CoBuddy (free)", - "display_name": "Baidu: CoBuddy (free)", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -62879,40 +71922,38 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-06", - "last_updated": "2026-05-07", + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 0.6 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "Baidu: ERNIE 4.5 VL 28B A3B", - "display_name": "Baidu: ERNIE 4.5 VL 28B A3B", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - 
"image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 30000, - "output": 8000 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -62920,20 +71961,32 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.14, - "output": 0.56 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21b-a3b", - "name": "Baidu: ERNIE 4.5 21B A3B", - "display_name": "Baidu: ERNIE 4.5 21B A3B", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -62943,8 +71996,8 @@ ] }, "limit": { - "context": 120000, - "output": 8000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -62953,49 +72006,71 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "release_date": "2025-07-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.2, + "output": 0.8 }, "type": "chat" - }, + } + ] + }, + "regolo-ai": { + "id": "regolo-ai", + "name": "Regolo AI", + "display_name": "Regolo AI", + "api": "https://api.regolo.ai/v1", + "doc": "https://docs.regolo.ai/", + "models": [ { - "id": "baidu/ernie-4.5-300b-a47b", - "name": "Baidu: ERNIE 4.5 300B A47B ", - "display_name": "Baidu: ERNIE 4.5 300B A47B ", + "id": "qwen3.5-122b", + "name": "Qwen3.5-122B", + "display_name": "Qwen3.5-122B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - 
"context": 123000, - "output": 12000 + "context": 262144, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2026-01", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.9, + "output": 3.6 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21b-a3b-thinking", - "name": "Baidu: ERNIE 4.5 21B A3B Thinking", - "display_name": "Baidu: ERNIE 4.5 21B A3B Thinking", + "id": "mistral-small3.2", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ "text" @@ -63005,29 +72080,29 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 120000, + "output": 120000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": false, + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.5, + "output": 2.2 }, "type": "chat" }, { - "id": "relace/relace-apply-3", - "name": "Relace: Relace Apply 3", - "display_name": "Relace: Relace Apply 3", + "id": "minimax-m2.5", + "name": "MiniMax 2.5", + "display_name": "MiniMax 2.5", "modalities": { "input": [ "text" @@ -63037,58 +72112,78 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 190000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + 
"default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2026-03-15", + "release_date": "2026-03-10", + "last_updated": "2026-03-10", "cost": { - "input": 0.85, - "output": 1.25 + "input": 0.8, + "output": 3.5 }, "type": "chat" }, { - "id": "relace/relace-search", - "name": "Relace: Relace Search", - "display_name": "Relace: Relace Search", + "id": "qwen3.5-9b", + "name": "Qwen3.5-9B", + "display_name": "Qwen3.5-9B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 262144, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 1, - "output": 3 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax: MiniMax M2.7", - "display_name": "MiniMax: MiniMax M2.7", + "id": "gpt-oss-20b", + "name": "GPT-OSS-20B", + "display_name": "GPT-OSS-20B", "modalities": { "input": [ "text" @@ -63098,8 +72193,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -63109,30 +72204,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": 
true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.4, + "output": 1.8 }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax: MiniMax M2", - "display_name": "MiniMax: MiniMax M2", + "id": "qwen3-coder-next", + "name": "Qwen3-Coder-Next", + "display_name": "Qwen3-Coder-Next", "modalities": { "input": [ "text" @@ -63142,8 +72230,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -63151,69 +72239,63 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-10-23", - "last_updated": "2026-03-15", + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.255, - "output": 1, - "cache_read": 0.03 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "minimax/minimax-01", - "name": "MiniMax: MiniMax-01", - "display_name": "MiniMax: MiniMax-01", + "id": "qwen3-embedding-8b", + "name": "Qwen3-Embedding-8B", + "display_name": "Qwen3-Embedding-8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000192, - "output": 1000192 + "context": 32768, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.2, - "output": 1.1 + "input": 0.1, + "output": 0.1 }, - "type": "chat" + "type": "embedding" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax: MiniMax M2.1", - "display_name": "MiniMax: MiniMax M2.1", + "id": 
"mistral-small-4-119b", + "name": "Mistral Small 4 119B", + "display_name": "Mistral Small 4 119B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 39322 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -63221,26 +72303,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.27, - "output": 0.95, - "cache_read": 0.03 + "input": 0.75, + "output": 3 }, "type": "chat" }, { - "id": "minimax/minimax-m1", - "name": "MiniMax: MiniMax M1", - "display_name": "MiniMax: MiniMax M1", + "id": "qwen3-reranker-4b", + "name": "Qwen3-Reranker-4B", + "display_name": "Qwen3-Reranker-4B", "modalities": { "input": [ "text" @@ -63250,29 +72326,28 @@ ] }, "limit": { - "context": 1000000, - "output": 40000 + "context": 32768, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.4, - "output": 2.2 + "input": 0.12, + "output": 0.12 }, - "type": "chat" + "type": "rerank" }, { - "id": "minimax/minimax-m2-her", - "name": "MiniMax: MiniMax M2-her", - "display_name": "MiniMax: MiniMax M2-her", + "id": "llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -63282,28 +72357,28 @@ ] }, "limit": { - "context": 65536, - "output": 2048 + "context": 128000, + "output": 16384 }, 
"temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-23", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.6, + "output": 2.7 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax: MiniMax M2.5", - "display_name": "MiniMax: MiniMax M2.5", + "id": "gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ "text" @@ -63313,8 +72388,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -63328,20 +72403,50 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.25, - "output": 1.2, - "cache_read": 0.029 + "input": 1, + "output": 4.2 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b", - "name": "Qwen: Qwen3 235B A22B", - "display_name": "Qwen: Qwen3 235B A22B", + "id": "qwen-image", + "name": "Qwen-Image", + "display_name": "Qwen-Image", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", + "cost": { + "input": 0.5, + "output": 2 + }, + "type": "imageGeneration" + }, + { + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -63351,176 +72456,178 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 120000, + "output": 
120000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2025-04-07", + "last_updated": "2025-04-07", "cost": { - "input": 0.455, - "output": 1.82, - "cache_read": 0.15 + "input": 0.05, + "output": 0.25 }, "type": "chat" - }, + } + ] + }, + "claudinio": { + "id": "claudinio", + "name": "Claudinio", + "display_name": "Claudinio", + "api": "https://api.claudin.io/v1", + "doc": "https://claudin.io", + "models": [ { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen: Qwen3.5-122B-A10B", - "display_name": "Qwen: Qwen3.5-122B-A10B", + "id": "claudinio", + "name": "Claudinio", + "display_name": "Claudinio", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2026-05", + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 0.26, - "output": 2.08 + "input": 0.5, + "output": 2, + "cache_read": 0.05 }, "type": "chat" - }, + } + ] + }, + "orcarouter": { + "id": "orcarouter", + "name": "OrcaRouter", + "display_name": "OrcaRouter", + "api": "https://api.orcarouter.ai/v1", + "doc": 
"https://docs.orcarouter.ai", + "models": [ { - "id": "qwen/qwen3-coder-plus", - "name": "Qwen: Qwen3 Coder Plus", - "display_name": "Qwen: Qwen3 Coder Plus", + "id": "orcarouter/auto", + "name": "OrcaRouter Auto", + "display_name": "OrcaRouter Auto", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2026-05-14", "cost": { - "input": 0.65, - "output": 3.25, - "cache_read": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3.6-27b", - "name": "Qwen: Qwen3.6 27B", - "display_name": "Qwen: Qwen3.6 27B", + "id": "grok/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + }, + "extra_capabilities": { + "reasoning": { + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-27", + "release_date": "2026-05-01", "last_updated": "2026-05-01", "cost": { - "input": 0.325, - "output": 3.25 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] 
}, "type": "chat" }, { - "id": "qwen/qwen3.5-27b", - "name": "Qwen: Qwen3.5-27B", - "display_name": "Qwen: Qwen3.5-27B", + "id": "z-ai/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -63539,20 +72646,22 @@ ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.195, - "output": 1.56 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-2507", - "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", + "id": "z-ai/glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -63562,8 +72671,8 @@ ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -63573,18 +72682,21 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-01", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.071, - "output": 0.1 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-8b", - "name": "Qwen: Qwen3 8B", - "display_name": "Qwen: Qwen3 8B", + "id": "z-ai/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -63594,8 +72706,8 @@ ] }, "limit": { - "context": 40960, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -63605,43 +72717,37 @@ }, 
"extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.05 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen: Qwen3.5 397B A17B", - "display_name": "Qwen: Qwen3.5 397B A17B", + "id": "z-ai/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -63649,34 +72755,25 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.39, - "output": 2.34 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen-vl-plus", - "name": "Qwen: Qwen VL Plus", - "display_name": "Qwen: Qwen VL Plus", + "id": "z-ai/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -63684,29 +72781,43 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, - 
"tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.1365, - "output": 0.4095, - "cache_read": 0.042 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-32b", - "name": "Qwen: Qwen3 32B", - "display_name": "Qwen: Qwen3 32B", + "id": "z-ai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -63716,8 +72827,8 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -63738,84 +72849,112 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-02-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.04 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen: Qwen2.5 VL 72B Instruct", - "display_name": "Qwen: Qwen2.5 VL 72B Instruct", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": 
"2025-02-01", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.8, - "output": 0.8, - "cache_read": 0.075 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen-max", - "name": "Qwen: Qwen-Max ", - "display_name": "Qwen: Qwen-Max ", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1.04, - "output": 4.16, - "cache_read": 0.32 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen-plus", - "name": "Qwen: Qwen-Plus", - "display_name": "Qwen: Qwen-Plus", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -63825,144 +72964,136 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.4, - "output": 1.2, - "cache_read": 0.08 + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3.6-35b-a3b", - "name": "Qwen: Qwen3.6 35B A3B", - "display_name": "Qwen: Qwen3.6 35B A3B", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.1612, - "output": 0.96525, - "cache_read": 0.1612 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen: Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", + "id": 
"openai/gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.26, - "output": 2.6 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "Qwen: Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", + "id": "openai/gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -63970,120 +73101,108 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-11", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.13, - "output": 1.56 - }, - "type": "chat" - }, - { - "id": "qwen/qwen3-vl-8b-instruct", 
- "name": "Qwen: Qwen3 VL 8B Instruct", - "display_name": "Qwen: Qwen3 VL 8B Instruct", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" + "input": 30, + "output": 180, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } ] }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", - "cost": { - "input": 0.08, - "output": 0.5 - }, "type": "chat" }, { - "id": "qwen/qwen3.5-flash-02-23", - "name": "Qwen: Qwen3.5-Flash", - "display_name": "Qwen: Qwen3.5-Flash", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": 
"chat" }, { - "id": "qwen/qwen3.6-plus", - "name": "Qwen: Qwen3.6 Plus", - "display_name": "Qwen: Qwen3.6 Plus", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -64092,158 +73211,174 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2026-04-11", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.325, - "output": 1.95, - "cache_read": 0.0325, - "cache_write": 0.40625 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "Qwen: Qwen3 Max", - "display_name": "Qwen: Qwen3 Max", + "id": "openai/gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, 
"open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28", - "name": "Qwen: Qwen Plus 0728", - "display_name": "Qwen: Qwen Plus 0728", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2025-09-09", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.26, - "output": 0.78 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-instruct-2507", - "name": "Qwen: Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", + "id": "openai/gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 
16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.09, - "output": 0.3, - "cache_read": 0.04 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-32b-instruct", - "name": "Qwen: Qwen3 VL 32B Instruct", - "display_name": "Qwen: Qwen3 VL 32B Instruct", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1047576, "output": 32768 }, "temperature": true, @@ -64253,31 +73388,34 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.104, - "output": 0.416 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "id": "openai/gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -64286,393 +73424,576 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + 
"default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-25", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.11, - "output": 0.6 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen: Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1047576, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-11", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.0975, - "output": 0.78 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-thinking-2507", - "name": "Qwen: Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 400000, + "output": 128000 
}, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.051, - "output": 0.34 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-7b-instruct", - "name": "Qwen: Qwen2.5 7B Instruct", - "display_name": "Qwen: Qwen2.5 7B Instruct", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09", - "last_updated": "2025-04-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": 
"2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.04, - "output": 0.1 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "qwen/qwen-vl-max", - "name": "Qwen: Qwen VL Max", - "display_name": "Qwen: Qwen VL Max", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.8, - "output": 3.2 + "input": 5, + "output": 22.5, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "qwen/qwen3-coder-flash", - "name": "Qwen: Qwen3 Coder Flash", - "display_name": "Qwen: Qwen3 Coder Flash", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, 
- "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.195, - "output": 0.975, - "cache_read": 0.06 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b", - "name": "Qwen: Qwen3 30B A3B", - "display_name": "Qwen: Qwen3 30B A3B", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.08, - "output": 0.28, - "cache_read": 0.03 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 52429 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - 
"open_weights": true, - "release_date": "2025-09-11", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.09, - "output": 1.1 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus-20260420", - "name": "Qwen: Qwen3.5 Plus 2026-04-20", - "display_name": "Qwen: Qwen3.5 Plus 2026-04-20", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.4, - "output": 2.4 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": 
"qwen/qwen3-coder-next", - "name": "Qwen: Qwen3 Coder Next", - "display_name": "Qwen: Qwen3 Coder Next", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-02", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.12, - "output": 0.75, - "cache_read": 0.035 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "qwen/qwen-2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - 
"attachment": false, - "open_weights": true, - "release_date": "2024-11-11", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0.015 + "input": 60, + "output": 270, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "Qwen: Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", + "id": "openai/gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", @@ -64683,38 +74004,42 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.13, - "output": 0.52 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen: Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { 
"input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 160000, + "context": 1047576, "output": 32768 }, "temperature": true, @@ -64722,20 +74047,22 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.07, - "output": 0.27 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen/qwen3-max-thinking", - "name": "Qwen: Qwen3 Max Thinking", - "display_name": "Qwen: Qwen3 Max Thinking", + "id": "openai/gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -64745,83 +74072,85 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-23", - "last_updated": "2026-03-15", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.78, - "output": 3.9 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "qwen/qwen-turbo", - "name": "Qwen: Qwen-Turbo", - "display_name": "Qwen: Qwen-Turbo", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, 
"reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-11-01", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.0325, - "output": 0.13, - "cache_read": 0.01 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", + "id": "openai/gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ "text", @@ -64832,8 +74161,8 @@ ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -64841,67 +74170,92 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-23", - "last_updated": "2026-01-10", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.2, - "output": 0.88, - "cache_read": 0.11 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3-coder", - "name": "Qwen: Qwen3 Coder 480B A35B", - "display_name": "Qwen: Qwen3 Coder 480B A35B", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + 
"image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.22, - "output": 1, - "cache_read": 0.022 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3.5-9b", - "name": "Qwen: Qwen3.5-9B", - "display_name": "Qwen: Qwen3.5-9B", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -64910,42 +74264,55 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-10", - 
"last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.05, - "output": 0.15 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-thinking", - "name": "Qwen: Qwen3 VL 8B Thinking", - "display_name": "Qwen: Qwen3 VL 8B Thinking", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -64954,114 +74321,141 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.117, - "output": 1.365 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3.6-max-preview", - "name": "Qwen: Qwen3.6 Max Preview", - "display_name": "Qwen: Qwen3.6 Max Preview", + "id": "openai/gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 1.04, - "output": 6.24, - "cache_write": 1.3 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28:thinking", - "name": "Qwen: Qwen Plus 0728 (thinking)", - "display_name": "Qwen: Qwen Plus 0728 (thinking)", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-09", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.26, - "output": 0.78 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "openai/gpt-5.3-chat-latest", + "name": 
"GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, "temperature": true, @@ -65069,33 +74463,37 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09", - "last_updated": "2026-01-10", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.12, - "output": 0.39 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3-14b", - "name": "Qwen: Qwen3 14B", - "display_name": "Qwen: Qwen3 14B", + "id": "kimi/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -65114,23 +74512,24 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.025 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen: Qwen3.5-35B-A3B", - "display_name": "Qwen: Qwen3.5-35B-A3B", + "id": "kimi/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "image", "text", + "image", "video" ], "output": [ @@ -65139,7 +74538,7 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -65160,31 +74559,31 @@ }, "attachment": true, "open_weights": true, - "release_date": 
"2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.1625, - "output": 1.3 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus-02-15", - "name": "Qwen: Qwen3.5 Plus 2026-02-15", - "display_name": "Qwen: Qwen3.5 Plus 2026-02-15", + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -65203,33 +74602,33 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.26, - "output": 1.56 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen/qwen3.6-flash", - "name": "Qwen: Qwen3.6 Flash", - "display_name": "Qwen: Qwen3.6 Flash", + "id": "minimax/minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -65239,30 +74638,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": 
"2026-02-12", "cost": { - "input": 0.25, - "output": 1.5, - "cache_write": 0.3125 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "alfredpros/codellama-7b-instruct-solidity", - "name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", - "display_name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", + "id": "minimax/minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -65272,28 +74666,42 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro-v2", - "name": "Kwaipilot: KAT-Coder-Pro V2", - "display_name": "Kwaipilot: KAT-Coder-Pro V2", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" @@ -65303,381 +74711,449 @@ ] }, "limit": { - "context": 256000, - "output": 80000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-11", + "release_date": "2026-02-13", + 
"last_updated": "2026-02-13", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview-05-06", - "name": "Google: Gemini 2.5 Pro Preview 05-06", - "display_name": "Google: Gemini 2.5 Pro Preview 05-06", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", + "default_enabled": false, + "mode": "mixed", "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, + "min": 1024, "unit": "tokens" }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.25, - "output": 10, - "reasoning": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "google/lyria-3-clip-preview", - "name": "Google: Lyria 3 Clip Preview", - "display_name": "Google: Lyria 3 Clip Preview", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-04-11", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview-customtools", - "name": "Google: Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Google: Gemini 3.1 Pro Preview Custom Tools", + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": 
true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ "low", + "medium", "high" ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 2, - "output": 12, - "reasoning": 12 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite-preview-09-2025", - "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", - "display_name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + 
"input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2026-03-15", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.1, - "output": 0.4, - "reasoning": 0.4, - "cache_read": 0.01, - "cache_write": 0.083333 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-001", - "name": "Google: Gemini 2.0 Flash", - "display_name": "Google: Gemini 2.0 Flash", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2026-03-15", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025, - "cache_write": 0.083333 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "google/lyria-3-pro-preview", - "name": "Google: Lyria 3 Pro Preview", - "display_name": "Google: Lyria 3 Pro Preview", + "id": 
"anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-04-11", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "google/gemma-3n-e4b-it", - "name": "Google: Gemma 3n 4B", - "display_name": "Google: Gemma 3n 4B", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.02, - "output": 0.04 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite-preview", - "name": "Google: Gemini 3.1 Flash Lite Preview", - "display_name": "Google: Gemini 3.1 Flash Lite Preview", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", 
"modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-15", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.25, - "output": 1.5, - "reasoning": 1.5 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Google: Gemini 3.1 Pro Preview", - "display_name": "Google: Gemini 3.1 Pro Preview", + "id": "qwen/qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", + "image", "video" ], "output": [ @@ -65685,7 +75161,7 @@ ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 65536 }, "temperature": true, @@ -65697,49 +75173,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": 
"summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-03-15", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 2, - "output": 12, - "reasoning": 12 + "input": 0.115, + "output": 0.688, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Google: Gemini 3 Flash Preview", - "display_name": "Google: Gemini 3 Flash Preview", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -65751,113 +75221,88 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.5, - "output": 3, - "reasoning": 3, - "cache_read": 0.05, - "cache_write": 0.083333 + "input": 0.115, + "output": 0.917 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Google: Gemini 2.5 Pro", - "display_name": "Google: Gemini 2.5 Pro", + "id": "qwen/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 
65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-20", - "last_updated": "2026-03-15", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 1.25, - "output": 10, - "reasoning": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "input": 0.359, + "output": 1.434 }, "type": "chat" }, { - "id": "google/gemini-3-pro-image-preview", - "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", - "display_name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ + "text", "image", - "text" + "video", + "audio" ], "output": [ - "image", "text" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -65865,39 +75310,32 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - 
"input": 2, - "output": 12, - "reasoning": 12 + "input": 0.172, + "output": 1.032 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Google: Gemma 4 31B", - "display_name": "Google: Gemma 4 31B", + "id": "qwen/qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "image", "text", + "image", "video" ], "output": [ @@ -65905,8 +75343,8 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -65914,101 +75352,158 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", "release_date": "2026-04-02", - "last_updated": "2026-04-11", + "last_updated": "2026-04-02", "cost": { - "input": 0.14, - "output": 0.4 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-image", - "name": "Google: Nano Banana (Gemini 2.5 Flash Image)", - "display_name": "Google: Nano Banana (Gemini 2.5 Flash Image)", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5 35B-A3B", + "display_name": "Qwen3.5 35B-A3B", "modalities": { "input": [ + "text", "image", - "text" + "video", + "audio" ], "output": [ - "image", "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": 
false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-08", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.057, + "output": 0.459 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Google: Gemma 3 12B", - "display_name": "Google: Gemma 3 12B", + "id": "qwen/qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ + "text", "image", - "text" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": true, - "release_date": "2025-03-13", - "last_updated": "2026-03-15", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.04, - "output": 0.13, - "cache_read": 0.015 + "input": 0.248, + "output": 1.485 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Google: Gemini 2.5 Flash", - "display_name": "Google: Gemini 2.5 Flash", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 
262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -66019,117 +75514,107 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-07-17", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.3, - "output": 2.5, - "reasoning": 2.5, - "cache_read": 0.03, - "cache_write": 0.083333 + "input": 0.086, + "output": 0.688 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-image-preview", - "name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", - "display_name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", + "id": "google/gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ + "text", "image", - "text" + "audio", + "video", + "pdf" ], "output": [ - "image", "text" ] }, "limit": { - "context": 65536, + "context": 1048576, "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { "input": 0.5, - "output": 3 + "output": 3, + "cache_read": 0.075, + "input_audio": 1 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemma-3-4b-it", - "name": "Google: Gemma 3 4B", - "display_name": "Google: Gemma 3 4B", + "id": "google/gemma-4-26b-a4b-it", + "name": 
"Gemma 4 26B", + "display_name": "Gemma 4 26B", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 19200 + "context": 256000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-03-13", - "last_updated": "2026-03-15", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.04, - "output": 0.08 + "input": 0.06, + "output": 0.33 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview", - "name": "Google: Gemini 2.5 Pro Preview 06-05", - "display_name": "Google: Gemini 2.5 Pro Preview 06-05", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "audio", + "text", "image", - "pdf", - "text" + "audio", + "video", + "pdf" ], "output": [ "text" @@ -66166,98 +75651,48 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 1.25, - "output": 10, - "reasoning": 10, + "input": 2.5, + "output": 15, "cache_read": 0.125, - "cache_write": 0.375 - }, - "type": "chat" - }, - { - "id": "google/gemma-2-27b-it", - "name": "Google: Gemma 2 27B", - "display_name": "Google: Gemma 2 27B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 2048 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-24", - "last_updated": "2024-06-24", - "cost": { - "input": 0.65, - "output": 0.65 - }, - "type": "chat" - }, - { - "id": "google/gemma-3-27b-it", - "name": 
"Google: Gemma 3 27B", - "display_name": "Google: Gemma 3 27B", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } ] }, - "limit": { - "context": 128000, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2026-03-15", - "cost": { - "input": 0.03, - "output": 0.11, - "cache_read": 0.02 - }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Google: Gemma 4 26B A4B", - "display_name": "Google: Gemma 4 26B A4B", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -66265,27 +75700,27 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-03", - "last_updated": "2026-04-11", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.12, - "output": 0.4 + "input": 0.13, + "output": 0.38 }, "type": "chat" }, { "id": "google/gemini-2.5-flash-lite", - "name": "Google: Gemini 2.5 Flash Lite", - "display_name": "Google: Gemini 2.5 Flash Lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" @@ -66293,7 +75728,7 @@ }, "limit": { "context": 1048576, - "output": 65535 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -66322,28 
+75757,28 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-01", "release_date": "2025-06-17", - "last_updated": "2026-03-15", + "last_updated": "2025-06-17", "cost": { "input": 0.1, "output": 0.4, - "reasoning": 0.4, "cache_read": 0.01, - "cache_write": 0.083333 + "input_audio": 0.3 }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite-001", - "name": "Google: Gemini 2.0 Flash Lite", - "display_name": "Google: Gemini 2.0 Flash Lite", + "id": "google/gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" @@ -66351,39 +75786,45 @@ }, "limit": { "context": 1048576, - "output": 8192 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "MoonshotAI: Kimi K2.5", - "display_name": "MoonshotAI: Kimi K2.5", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ + "text", "image", - "text" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -66394,72 +75835,67 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", 
"continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.45, - "output": 2.2 - }, - "type": "chat" - }, - { - "id": "moonshotai/kimi-k2-0905", - "name": "MoonshotAI: Kimi K2 0905", - "display_name": "MoonshotAI: Kimi K2 0905", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" + "input": 4, + "output": 18, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } ] }, - "limit": { - "context": 131072, - "output": 26215 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.15 - }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "MoonshotAI: Kimi K2.6", - "display_name": "MoonshotAI: Kimi K2.6", + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -66470,71 +75906,111 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } 
}, "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 4, + "output": 18, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "moonshotai/kimi-k2", - "name": "MoonshotAI: Kimi K2 0711", - "display_name": "MoonshotAI: Kimi K2 0711", + "id": "google/gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 26215 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.55, - "output": 2.2 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "MoonshotAI: Kimi K2 Thinking", - "display_name": "MoonshotAI: Kimi K2 Thinking", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - 
"context": 131072, - "output": 65535 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -66545,187 +76021,169 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2026-03-15", - "cost": { - "input": 0.47, - "output": 2, - "cache_read": 0.2 - }, - "type": "chat" - }, - { - "id": "aion-labs/aion-1.0", - "name": "AionLabs: Aion-1.0", - "display_name": "AionLabs: Aion-1.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { "input": 4, - "output": 8 - }, - "type": "chat" - }, - { - "id": "aion-labs/aion-rp-llama-3.1-8b", - "name": "AionLabs: Aion-RP 1.0 (8B)", - "display_name": "AionLabs: Aion-RP 1.0 (8B)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" + "output": 18, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } ] }, - "limit": { - "context": 32768, - "output": 32768 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", - "cost": 
{ - "input": 0.8, - "output": 1.6 - }, "type": "chat" }, { - "id": "aion-labs/aion-2.0", - "name": "AionLabs: Aion-2.0", - "display_name": "AionLabs: Aion-2.0", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-15", - "cost": { - "input": 0.8, - "output": 1.6 - }, - "type": "chat" - }, - { - "id": "aion-labs/aion-1.0-mini", - "name": "AionLabs: Aion-1.0-Mini", - "display_name": "AionLabs: Aion-1.0-Mini", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.7, - "output": 1.4 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "thedrummer/unslopnemo-12b", - "name": "TheDrummer: UnslopNemo 12B", - "display_name": "TheDrummer: UnslopNemo 12B", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + 
"display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-09", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "thedrummer/cydonia-24b-v4.1", - "name": "TheDrummer: Cydonia 24B V4.1", - "display_name": "TheDrummer: Cydonia 24B V4.1", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ "text" @@ -66735,28 +76193,30 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-27", - "last_updated": "2026-03-15", + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "cost": { - "input": 0.3, - "output": 0.5 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "thedrummer/skyfall-36b-v2", - "name": "TheDrummer: Skyfall 36B V2", - "display_name": 
"TheDrummer: Skyfall 36B V2", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -66766,28 +76226,42 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1000000, + "output": 384000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-03-11", - "last_updated": "2026-03-15", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.55, - "output": 0.8 + "input": 0.56, + "output": 1.12, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "thedrummer/rocinante-12b", - "name": "TheDrummer: Rocinante 12B", - "display_name": "TheDrummer: Rocinante 12B", + "id": "deepseek/deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -66797,32 +76271,44 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2024-09-30", - "last_updated": "2026-03-15", + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "cost": { - "input": 0.17, - "output": 0.43 + "input": 0.435, + "output": 0.87, + "cache_read": 0.028 }, "type": "chat" }, { - "id": 
"anthropic/claude-opus-4.1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -66830,8 +76316,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -66839,35 +76325,55 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.19, + "output": 0.37, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "opencode-go": { + "id": "opencode-go", + "name": "OpenCode Go", + "display_name": "OpenCode Go", + "api": "https://opencode.ai/zen/go/v1", + "doc": "https://opencode.ai/docs/zen", + "models": [ { - "id": "anthropic/claude-3.7-sonnet:thinking", - "name": "Anthropic: Claude 3.7 Sonnet (thinking)", - "display_name": "Anthropic: Claude 3.7 Sonnet (thinking)", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -66878,105 +76384,80 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - 
"interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6-fast", - "name": "Anthropic: Claude Opus 4.6 (Fast)", - "display_name": "Anthropic: Claude Opus 4.6 (Fast)", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ + "text", "image", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-04-07", - "last_updated": "2026-04-11", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 30, - "output": 150, - "cache_read": 3, - "cache_write": 37.5 + "input": 0.2, + "output": 1.2, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -66984,118 +76465,93 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 202752, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Anthropic: Claude Opus 4.6", - "display_name": "Anthropic: Claude Opus 4.6", + "id": "mimo-v2-omni", + "name": "MiMo V2 Omni", + "display_name": "MiMo V2 Omni", "modalities": { "input": [ "text", - "image" + "image", 
+ "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 262144, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Anthropic: Claude Opus 4.7", - "display_name": "Anthropic: Claude Opus 4.7", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -67103,58 +76559,43 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - 
"Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.74, + "output": 3.48, + "cache_read": 0.0145 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -67162,8 +76603,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -67171,26 +76612,51 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - 
"name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -67198,8 +76664,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 204800, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -67207,26 +76673,29 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", + "id": "minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -67234,8 +76703,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -67243,60 +76712,83 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-24", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 
1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - "name": "Anthropic: Claude 3 Haiku", - "display_name": "Anthropic: Claude 3 Haiku", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-03-07", - "last_updated": "2024-03-07", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "mimo-v2-pro", + "name": "MiMo V2 Pro", + "display_name": "MiMo V2 Pro", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -67304,8 +76796,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -67313,59 +76805,115 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2024-12", + "release_date": 
"2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "mimo-v2.5", + "name": "MiMo V2.5", + "display_name": "MiMo V2.5", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.8, - "output": 4, + "input": 0.4, + "output": 2, "cache_read": 0.08, - "cache_write": 1 + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + } }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Anthropic: Claude Haiku 4.5", - "display_name": "Anthropic: Claude Haiku 4.5", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -67373,8 +76921,8 @@ 
] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -67382,25 +76930,35 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Anthropic: Claude Sonnet 4.6", - "display_name": "Anthropic: Claude Sonnet 4.6", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -67408,91 +76966,100 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202752, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 3, - "output": 15 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "switchpoint/router", - "name": "Switchpoint Router", - "display_name": "Switchpoint Router", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-12", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.85, - "output": 3.4 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" - }, + } + ] + }, + "llmgateway": { + "id": "llmgateway", + "name": "LLM Gateway", + "display_name": "LLM Gateway", + "api": "https://api.llmgateway.io/v1", + "doc": "https://llmgateway.io/docs", + "models": [ { - "id": "bytedance/ui-tars-1.5-7b", - "name": "ByteDance: UI-TARS 7B ", - "display_name": "ByteDance: UI-TARS 7B ", + "id": "gemma-2-27b-it-together", + "name": "Gemma 2 27B IT", + "display_name": "Gemma 2 27B IT", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -67500,28 +77067,28 @@ ] }, "limit": { - "context": 128000, - "output": 2048 + 
"context": 8192, + "output": 16384 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 0.1, - "output": 0.2 + "input": 0.08, + "output": 0.08 }, "type": "chat" }, { - "id": "tngtech/deepseek-r1t2-chimera", - "name": "TNG: DeepSeek R1T2 Chimera", - "display_name": "TNG: DeepSeek R1T2 Chimera", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct (2507)", + "display_name": "Qwen3 30B A3B Instruct (2507)", "modalities": { "input": [ "text" @@ -67531,30 +77098,28 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, "release_date": "2025-07-08", "last_updated": "2025-07-08", "cost": { - "input": 0.25, - "output": 0.85, - "cache_read": 0.125 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5-pro", - "name": "Xiaomi: MiMo V2.5 Pro", - "display_name": "Xiaomi: MiMo V2.5 Pro", + "id": "claude-3-7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", "modalities": { "input": [ "text" @@ -67564,99 +77129,94 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ 
"thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-omni", - "name": "Xiaomi: MiMo-V2-Omni", - "display_name": "Xiaomi: MiMo-V2-Omni", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5", - "name": "Xiaomi: MiMo-V2.5", - "display_name": "Xiaomi: MiMo-V2.5", + "id": "seed-1-6-250615", + "name": "Seed 1.6 (250615)", + "display_name": "Seed 1.6 (250615)", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -67664,88 +77224,65 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": 
true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2025-06-25", + "last_updated": "2025-06-25", "cost": { - "input": 0.4, + "input": 0.25, "output": 2, - "cache_read": 0.08, - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "cache_read": 0.05 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-pro", - "name": "Xiaomi: MiMo-V2-Pro", - "display_name": "Xiaomi: MiMo-V2-Pro", + "id": "gpt-4o-mini-search-preview", + "name": "GPT-4o Mini Search Preview", + "display_name": "GPT-4o Mini Search Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "Xiaomi: MiMo-V2-Flash", - "display_name": "Xiaomi: MiMo-V2-Flash", + "id": "seed-1-6-flash-250715", + "name": "Seed 1.6 Flash (250715)", + "display_name": "Seed 1.6 Flash (250715)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -67753,139 +77290,116 @@ "supported": true, "default": true }, - "attachment": false, 
+ "attachment": true, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.09, - "output": 0.29, - "cache_read": 0.045 - }, - "type": "chat" - } - ] - }, - "sap-ai-core": { - "id": "sap-ai-core", - "name": "SAP AI Core", - "display_name": "SAP AI Core", - "doc": "https://help.sap.com/docs/sap-ai-core", - "models": [ + "input": 0.07, + "output": 0.3, + "cache_read": 0.01 + }, + "type": "chat" + }, { - "id": "anthropic--claude-4.6-opus", - "name": "anthropic--claude-4.6-opus", - "display_name": "anthropic--claude-4.6-opus", + "id": "qwen2-5-vl-32b-instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2025-03-15", + "last_updated": "2025-03-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "anthropic--claude-3-haiku", - "name": "anthropic--claude-3-haiku", - "display_name": "anthropic--claude-3-haiku", + "id": "gemma-3-27b", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - 
"knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "anthropic--claude-3-opus", - "name": "anthropic--claude-3-opus", - "display_name": "anthropic--claude-3-opus", + "id": "llama-3.1-70b-instruct", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ "text", @@ -67896,10 +77410,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -67908,40 +77422,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - 
"high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "gpt-5-nano", - "display_name": "gpt-5-nano", + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ "text", @@ -67952,10 +77454,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -67963,56 +77465,36 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", + "id": "seed-1-6-250915", + "name": "Seed 1.6 (250915)", + "display_name": "Seed 1.6 (250915)", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - 
"output": 65536 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -68020,181 +77502,151 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-06-05", + "open_weights": true, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "anthropic--claude-3.7-sonnet", - "name": "anthropic--claude-3.7-sonnet", - "display_name": "anthropic--claude-3.7-sonnet", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 (0528)", + "display_name": "DeepSeek R1 (0528)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 64000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "attachment": false, + "open_weights": true, + 
"release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "sonar-pro", - "name": "sonar-pro", - "display_name": "sonar-pro", + "id": "codestral-2508", + "name": "Codestral", + "display_name": "Codestral", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 3, - "output": 15 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "anthropic--claude-4.5-sonnet", - "name": "anthropic--claude-4.5-sonnet", - "display_name": "anthropic--claude-4.5-sonnet", + "id": "qwen3-vl-flash", + "name": "Qwen3 VL Flash", + "display_name": "Qwen3 VL Flash", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.05, + "output": 0.4, + "cache_read": 
0.01 }, "type": "chat" }, { - "id": "anthropic--claude-4.6-sonnet", - "name": "anthropic--claude-4.6-sonnet", - "display_name": "anthropic--claude-4.6-sonnet", + "id": "glm-4.6v-flash", + "name": "GLM-4.6V Flash", + "display_name": "GLM-4.6V Flash", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -68203,63 +77655,62 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "sonar-deep-research", - "display_name": "sonar-deep-research", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 163840, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-02-01", - "last_updated": "2025-09-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2, - "output": 8, - "reasoning": 3 + "input": 0.28, + "output": 0.42, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": "gemini-pro-latest", + "name": "Gemini Pro Latest", + 
"display_name": "Gemini Pro Latest", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -68275,56 +77726,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-06-05", + "release_date": "2026-02-27", + "last_updated": "2026-02-27", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "anthropic--claude-4.5-opus", - "name": "anthropic--claude-4.5-opus", - "display_name": "anthropic--claude-4.5-opus", + "id": "qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B FP8", + "display_name": "Qwen3 30B A3B FP8", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -68332,23 +77759,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "sonar", - "name": "sonar", - "display_name": "sonar", + "id": "qwen-coder-plus", + "name": "Qwen Coder Plus", + "display_name": "Qwen Coder Plus", "modalities": { "input": [ "text" @@ -68358,289 +77782,217 
@@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 1, + "input": 0.5, "output": 1 }, "type": "chat" }, { - "id": "anthropic--claude-4-opus", - "name": "anthropic--claude-4-opus", - "display_name": "anthropic--claude-4-opus", + "id": "minimax-m2.1-lightning", + "name": "MiniMax M2.1 Lightning", + "display_name": "MiniMax M2.1 Lightning", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 196608, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.12, + "output": 0.48 }, "type": "chat" }, { - "id": "anthropic--claude-3-sonnet", - "name": "anthropic--claude-3-sonnet", - "display_name": "anthropic--claude-3-sonnet", + "id": "llama-3.1-nemotron-ultra-253b", + "name": "Llama 3.1 Nemotron Ultra 253B", + "display_name": "Llama 3.1 Nemotron Ultra 253B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - 
"knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-07", + "last_updated": "2025-04-07", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "anthropic--claude-4-sonnet", - "name": "anthropic--claude-4-sonnet", - "display_name": "anthropic--claude-4-sonnet", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.6, + "output": 6.4 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "gemini-2.5-flash-lite", - "display_name": "gemini-2.5-flash-lite", + "id": "glm-4.5-airx", + "name": "GLM-4.5 AirX", + "display_name": "GLM-4.5 AirX", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 1.1, + "output": 4.5, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "anthropic--claude-4.5-haiku", - "name": "anthropic--claude-4.5-haiku", - "display_name": "anthropic--claude-4.5-haiku", + "id": "llama-3.2-11b-instruct", + "name": "Llama 3.2 11B Instruct", + "display_name": "Llama 3.2 11B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.07, + "output": 0.33 }, "type": "chat" }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "grok-4-0709", + "name": "Grok 4 (0709)", + "display_name": "Grok 4 (0709)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - 
"high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "gpt-4.1", - "display_name": "gpt-4.1", + "id": "ministral-14b-2512", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ "text", @@ -68651,30 +78003,28 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "gpt-4.1-mini", - "display_name": "gpt-4.1-mini", + "id": "gpt-4o-search-preview", + "name": "GPT-4o Search Preview", + "display_name": "GPT-4o Search Preview", "modalities": { "input": [ "text", @@ -68685,106 +78035,65 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 2.5, + "output": 10 }, 
"type": "chat" }, { - "id": "anthropic--claude-3.5-sonnet", - "name": "anthropic--claude-3.5-sonnet", - "display_name": "anthropic--claude-3.5-sonnet", + "id": "gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 32766 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - } - ] - }, - "morph": { - "id": "morph", - "name": "Morph", - "display_name": "Morph", - "api": "https://api.morphllm.com/v1", - "doc": "https://docs.morphllm.com/api-reference/introduction", - "models": [ - { - "id": "auto", - "name": "Auto", - "display_name": "Auto", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 32000 + "supported": true, + "default": true }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.85, - "output": 1.55 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -68794,28 +78103,29 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 262144, + "output": 65536 }, - "temperature": false, - "tool_call": false, + 
"temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { "input": 0.8, - "output": 1.2 + "output": 4 }, "type": "chat" }, { - "id": "morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking (2507)", + "display_name": "Qwen3 30B A3B Thinking (2507)", "modalities": { "input": [ "text" @@ -68825,51 +78135,10 @@ ] }, "limit": { - "context": 32000, - "output": 32000 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", - "cost": { - "input": 0.9, - "output": 1.9 - }, - "type": "chat" - } - ] - }, - "cloudflare-ai-gateway": { - "id": "cloudflare-ai-gateway", - "name": "Cloudflare AI Gateway", - "display_name": "Cloudflare AI Gateway", - "doc": "https://developers.cloudflare.com/ai-gateway/", - "models": [ - { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -68878,73 +78147,59 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + 
"continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "llama-4-scout", + "name": "Llama 4 Scout", + "display_name": "Llama 4 Scout", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 10, - "output": 30 + "input": 0.18, + "output": 0.59 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "ministral-3b-2512", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text", @@ -68955,199 +78210,137 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + 
"supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "qwen3-4b-fp8", + "name": "Qwen3 4B FP8", + "display_name": "Qwen3 4B FP8", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 20, - "output": 80 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B FP8", + "display_name": "Qwen3 235B A22B FP8", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": 
"2024-07-18", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.5, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "qwen25-coder-7b", + "name": "Qwen2.5 Coder 7B", + "display_name": "Qwen2.5 Coder 7B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "qwen3-vl-30b-a3b-thinking", + "name": "Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen3 VL 30B A3B Thinking", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -69156,40 +78349,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": 
"medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "release_date": "2025-10-02", + "last_updated": "2025-10-02", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text", @@ -69200,52 +78381,30 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.56, + "output": 1.68, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "llama-4-scout-17b-instruct", + "name": "Llama 4 Scout 17B Instruct", + "display_name": "Llama 4 Scout 17B Instruct", 
"modalities": { "input": [ "text", @@ -69256,45 +78415,28 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 2048 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "qwen3-32b-fp8", + "name": "Qwen3 32B FP8", + "display_name": "Qwen3 32B FP8", "modalities": { "input": [ "text" @@ -69304,33 +78446,33 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "open_weights": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "claude-3-opus", + "name": "Claude 3 Opus", + "display_name": "Claude 3 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -69338,44 +78480,28 @@ }, "limit": { 
"context": 200000, - "output": 100000 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 15, + "output": 75, + "cache_read": 1.5 }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct (2507)", + "display_name": "Qwen3 235B A22B Instruct (2507)", "modalities": { "input": [ "text" @@ -69385,7 +78511,7 @@ ] }, "limit": { - "context": 8192, + "context": 131072, "output": 8192 }, "temperature": true, @@ -69393,128 +78519,83 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 30, - "output": 60 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "custom", + "name": "Custom Model", + "display_name": "Custom Model", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - 
"default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "llama-3-70b-instruct", + "name": "Llama 3 70B Instruct", + "display_name": "Llama 3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 8000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.51, + "output": 0.74 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "qwen3-vl-8b-instruct", + "name": "Qwen3 VL 8B Instruct", + "display_name": "Qwen3 VL 8B Instruct", "modalities": { "input": [ "text", 
@@ -69525,271 +78606,209 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "open_weights": true, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking (2507)", + "display_name": "Qwen3 235B A22B Thinking (2507)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - 
"display_name": "Claude Haiku 4.5 (latest)", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "output": 3, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "claude-3-5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 0.8, + "output": 4, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "attachment": false, + "open_weights": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0.04, + "output": 0.04 }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "type": "chat" + }, + { + "id": "gemma-3-1b-it", + "name": "Gemma 3 1B IT", + "display_name": "Gemma 3 1B IT", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.08, + "output": 0.3 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max (2026-01-23)", + "display_name": "Qwen3 Max (2026-01-23)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 256000, + "output": 32800 }, "temperature": true, "tool_call": true, @@ -69799,148 +78818,138 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3, + "output": 15, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "anthropic/claude-3-5-haiku", - "name": "Claude Haiku 
3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "glm-4.6v-flashx", + "name": "GLM-4.6V FlashX", + "display_name": "GLM-4.6V FlashX", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.04, + "output": 0.4, + "cache_read": 0 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "minimax-text-01", + "name": "MiniMax Text 01", + "display_name": "MiniMax Text 01", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1000000, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - 
"text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 32766 }, "temperature": true, "tool_call": true, @@ -69953,177 +78962,128 @@ "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.15, + "output": 0.75 }, "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, 
"reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "ministral-8b-2512", + "name": "Ministral 8B", + "display_name": "Ministral 8B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6 (latest)", - "display_name": "Claude Opus 4.6 (latest)", + "id": "seed-1-8-251228", + "name": "Seed 1.8 (251228)", + "display_name": "Seed 1.8 (251228)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - 
"effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "open_weights": true, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "qwen3-vl-30b-a3b-instruct", + "name": "Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen3 VL 30B A3B Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -70132,77 +79092,63 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "release_date": "2025-10-02", + "last_updated": "2025-10-02", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.1, + "output": 0.1 }, "type": "chat" - }, - { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + }, + { + "id": "llama-4-maverick-17b-instruct", + "name": "Llama 4 Maverick 17B Instruct", + "display_name": "Llama 4 Maverick 17B Instruct", "modalities": { "input": [ 
"text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.24, + "output": 0.97 }, "type": "chat" }, { - "id": "anthropic/claude-3-sonnet", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "auto", + "name": "Auto Route", + "display_name": "Auto Route", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -70211,128 +79157,82 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-3-opus", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "glm-4.5-x", + "name": "GLM-4.5 X", + "display_name": "GLM-4.5 X", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + 
"attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 2.2, + "output": 8.9, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "glm-4-32b-0414-128k", + "name": "GLM-4 32B (0414-128k)", + "display_name": "GLM-4 32B (0414-128k)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.1, + "output": 0.1 }, "type": "chat" - } - ] - }, - "github-copilot": { - "id": "github-copilot", - "name": "GitHub Copilot", - "display_name": "GitHub Copilot", - "api": "https://api.githubcopilot.com", - "doc": "https://docs.github.com/en/copilot", - "models": [ + }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-max", - "display_name": "GPT-5.1-Codex-max", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 
Fast Reasoning", + "display_name": "Grok 4 Fast Reasoning", "modalities": { "input": [ "text", @@ -70343,51 +79243,35 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ "text", @@ -70398,60 +79282,42 @@ ] }, "limit": { - "context": 144000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -70459,60 +79325,40 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0 + "input": 0.22, + "output": 0.22 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -70520,40 +79366,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ "text", @@ -70564,51 +79393,29 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 + "input": 2.8, + "output": 8.4 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5-mini", - "display_name": "GPT-5-mini", + "id": "mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ "text", @@ -70619,65 +79426,40 @@ ] }, "limit": { - 
"context": 264000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -70687,48 +79469,36 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": 
"GPT-5.3-Codex", - "display_name": "GPT-5.3-Codex", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": false, "tool_call": true, @@ -70739,52 +79509,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 64000 }, "temperature": true, @@ -70795,208 +79555,151 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - 
"release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 264000, - "output": 64000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, 
"tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0, - "output": 0 + "input": 6, + "output": 24, + "cache_read": 1.3, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 144000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "qwen3-vl-plus", + "name": "Qwen3-VL Plus", + "display_name": "Qwen3-VL Plus", "modalities": { "input": [ "text", @@ -71007,10 +79710,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -71019,39 +79722,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 1.6, + "reasoning": 4.8 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-mini", - "display_name": "GPT-5.1-Codex-mini", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -71081,7 +79775,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -71092,33 +79787,37 @@ "visibility": "hidden" } }, - "attachment": 
false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 216000, - "output": 16000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -71126,21 +79825,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -71150,102 +79861,87 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-08", - 
"release_date": "2025-08-27", - "last_updated": "2025-08-27", + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 264000, - "output": 64000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 144000, - "output": 32000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -71255,53 +79951,21 @@ }, "attachment": true, "open_weights": false, - 
"knowledge": "2025-03-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "claude-opus-41", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 80000, - "output": 16000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", @@ -71312,8 +79976,8 @@ ] }, "limit": { - "context": 160000, - "output": 32000 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -71323,19 +79987,35 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", @@ -71377,66 +80057,37 
@@ "visibility": "hidden" } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -71448,38 +80099,53 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-03-20", 
+ "last_updated": "2025-06-05", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ "text", @@ -71490,123 +80156,121 @@ ] }, "limit": { - "context": 144000, - "output": 32000 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2 }, 
"type": "chat" }, { - "id": "claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0, - "output": 0 + "input": 30, + "output": 180, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ "text", @@ -71647,30 +80311,22 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-09-30", "release_date": "2025-11-13", "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" - } - ] - }, - "mixlayer": { - "id": "mixlayer", - "name": "Mixlayer", - "display_name": "Mixlayer", - "api": "https://models.mixlayer.ai/v1", - "doc": "https://docs.mixlayer.com", - "models": [ + }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5 122B A10B", - "display_name": "Qwen3.5 122B A10B", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ "text" @@ -71680,8 +80336,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -71701,32 +80357,34 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.4, - "output": 3.2 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": 
"qwen/qwen3.5-27b", - "name": "Qwen3.5 27B", - "display_name": "Qwen3.5 27B", + "id": "gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -71735,28 +80393,38 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.3, - "output": 2.4 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -71766,8 +80434,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -71788,18 +80456,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.6, - "output": 3.6 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "qwen/qwen3.5-9b", - 
"name": "Qwen3.5 9B", - "display_name": "Qwen3.5 9B", + "id": "sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ "text" @@ -71809,51 +80479,42 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen3.5 35B A3B", - "display_name": "Qwen3.5 35B A3B", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -71863,68 +80524,61 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.25, - "output": 1.3 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" - } - ] - }, - 
"xiaomi-token-plan-sgp": { - "id": "xiaomi-token-plan-sgp", - "name": "Xiaomi Token Plan (Singapore)", - "display_name": "Xiaomi Token Plan (Singapore)", - "api": "https://token-plan-sgp.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ + }, { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", + "id": "qwen35-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 262144, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ "text" @@ -71934,8 +80588,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -71943,33 +80597,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0, - "output": 0, - 
"cache_read": 0 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -71979,14 +80623,13 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -72001,93 +80644,62 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - 
"context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -72095,26 +80707,16 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, @@ -72157,78 +80759,32 @@ "release_date": "2026-04-22", "last_updated": "2026-04-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 1, + "output": 3, + "cache_read": 0.2, "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } - }, - "type": "chat" - } - ] - }, - "zai": { - "id": "zai", - "name": "Z.AI", - "display_name": "Z.AI", - "api": "https://api.z.ai/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ - { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", - "modalities": { - "input": [ - "text", - "image", - "video", - "pdf" - ], - "output": [ - "text" + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + 
"cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } ] }, - "limit": { - "context": 200000, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", - "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24, - "cache_write": 0 - }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -72249,43 +80805,38 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -72293,33 +80844,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": 
"summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -72338,23 +80877,28 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, "knowledge": "2025-04", "release_date": "2026-01-19", "last_updated": "2026-01-19", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, + "input": 0, + "output": 0, + "cache_read": 0, "cache_write": 0 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ "text" @@ -72364,8 +80908,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -72386,55 +80930,19 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", - "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 - }, - "type": "chat" - }, - { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 98304 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": 
true, - "knowledge": "2025-04", + "knowledge": "2024-04", "release_date": "2025-07-28", "last_updated": "2025-07-28", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "devstral-small-2507", + "name": "Devstral Small", + "display_name": "Devstral Small", "modalities": { "input": [ "text" @@ -72444,105 +80952,57 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", - "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 - }, - "type": "chat" - }, - { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24, - "cache_write": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", "image", - 
"video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.6, - "output": 1.8 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, @@ -72587,44 +81047,9 @@ "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", - "modalities": { - "input": [ - "text", - "image", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", - "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" - }, - { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -72649,17 +81074,17 @@ "release_date": "2025-07-28", "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, "cache_write": 0 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ "text" @@ -72669,8 +81094,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ 
-72680,35 +81105,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-04-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.05, + "output": 0.2, + "reasoning": 0.5 }, "type": "chat" - } - ] - }, - "opencode": { - "id": "opencode", - "name": "OpenCode Zen", - "display_name": "OpenCode Zen", - "api": "https://opencode.ai/zen/v1", - "doc": "https://opencode.ai/docs/zen", - "models": [ + }, { - "id": "minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ "text" @@ -72718,56 +81139,44 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 1.6, + "output": 6.4 }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": 
"Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -72777,54 +81186,59 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", "effort_options": [ - "none", "low", "medium", "high" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -72832,73 +81246,66 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + 
"verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "gemma-3n-e2b-it", + "name": "Gemma 3n 2B", + "display_name": "Gemma 3n 2B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 2000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": true, "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.08 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -72930,65 +81337,55 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.1 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": 
"chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "glm-4.7-free", - "name": "GLM-4.7 Free", - "display_name": "GLM-4.7 Free", + "id": "gemma-3n-e4b-it", + "name": "Gemma 3n 4B", + "display_name": "Gemma 3n 4B", "modalities": { "input": [ "text" @@ -72998,48 +81395,35 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 2000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-10", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { "input": 0, - "output": 0, 
- "cache_read": 0 + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.1-pro", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", "modalities": { "input": [ "text", "image", - "video", "audio", + "video", "pdf" ], "output": [ @@ -73054,18 +81438,20 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ @@ -73076,28 +81462,25 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -73105,8 +81488,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -73118,45 +81501,38 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", + "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 512, + "max": 
24576, + "auto": -1, "unit": "tokens" }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "kimi-k2.5-free", - "name": "Kimi K2.5 Free", - "display_name": "Kimi K2.5 Free", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", @@ -73168,8 +81544,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -73188,34 +81564,52 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": 
"gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -73229,35 +81623,31 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "high", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high", - "xhigh" + "high" ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, @@ -73318,105 +81708,9 @@ "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - 
"visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", - "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" - }, - { - "id": "minimax-m2.5-free", - "name": "MiniMax M2.5 Free", - "display_name": "MiniMax M2.5 Free", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 204800, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "ring-2.6-1t-free", - "name": "Ring 2.6 1T Free", - "display_name": "Ring 2.6 1T Free", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -73426,52 +81720,41 @@ ] }, "limit": { - "context": 262000, - "output": 66000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-05-08", - "last_updated": "2026-05-08", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "gpt-5.4", + 
"name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -73505,110 +81788,87 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "deepseek-v4-flash-free", - "name": "DeepSeek V4 Flash Free", - "display_name": "DeepSeek V4 Flash Free", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "big-pickle", - "name": "Big Pickle", - "display_name": "Big Pickle", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + 
"context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-10-17", - "last_updated": "2025-10-17", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", @@ -73621,49 +81881,41 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 
16384 }, "temperature": true, "tool_call": true, @@ -73682,81 +81934,66 @@ ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next 80B-A3B (Thinking)", + "display_name": "Qwen3-Next 80B-A3B (Thinking)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.5, + "output": 6 }, "type": "chat" }, { - "id": "claude-3-5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "claude-opus-4-5-20251101", + "name": "Claude 
Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -73769,41 +82006,7 @@ }, "limit": { "context": 200000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" - }, - { - "id": "minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 204800, - "output": 131072 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -73811,33 +82014,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.1 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -73847,8 +82040,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -73869,24 +82062,26 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + 
"knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -73894,53 +82089,29 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -73952,52 +82123,32 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -74027,7 +82178,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -74040,33 +82192,31 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -74074,43 +82224,43 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", 
- "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 1.15, + "output": 8, + "cache_read": 0.15 + }, "type": "chat" }, { - "id": "gemini-3-flash", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -74122,126 +82272,67 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", - "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - }, - "type": "chat" - }, - { - "id": "trinity-large-preview-free", - "name": "Trinity Large Preview", - "display_name": "Trinity Large Preview", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": false, "open_weights": true, - "knowledge": 
"2025-06", - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", @@ -74253,8 +82344,8 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -74267,14 +82358,8 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ - "medium", - "high", 
- "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -74284,20 +82369,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 30, - "output": 180, - "cache_read": 30 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "glm-5-free", - "name": "GLM-5 Free", - "display_name": "GLM-5 Free", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -74307,7 +82392,7 @@ ] }, "limit": { - "context": 204800, + "context": 1048576, "output": 131072 }, "temperature": true, @@ -74328,63 +82413,108 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + 
"open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", + "cost": { + "input": 0.21, + "output": 0.63 }, - "attachment": true, + "type": "chat" + }, + { + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 32768, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.07, + "output": 0.27, + "input_audio": 4.44, + "output_audio": 8.89 }, "type": "chat" }, { - "id": "minimax-m2.1-free", - "name": "MiniMax M2.1 Free", - "display_name": "MiniMax M2.1 Free", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -74394,8 +82524,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -74403,30 +82533,90 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0, "output": 0, - "cache_read": 0 + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3.6-plus-free", - "name": "Qwen3.6 Plus Free", - "display_name": "Qwen3.6 Plus Free", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + 
"display_name": "Claude Opus 4.7", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "type": "chat" + }, + { + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" ], "output": [ "text" @@ -74434,7 +82624,7 @@ }, "limit": { "context": 1048576, - "output": 64000 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -74453,22 +82643,38 @@ ] } }, - "attachment": false, - "open_weights": false, + "attachment": true, + "open_weights": true, "knowledge": "2024-12", - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + }, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", 
+ "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -74478,8 +82684,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -74489,57 +82695,75 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.1 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "ling-2.6-flash-free", - "name": "Ling 2.6 Flash Free", - "display_name": "Ling 2.6 Flash Free", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262100, - "output": 32800 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 1.5, + 
"cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "gemini-3-pro", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", @@ -74582,8 +82806,8 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { "input": 2, "output": 12, @@ -74592,27 +82816,37 @@ "input": 4, "output": 18, "cache_read": 0.4 - } + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "grok-4-20-beta-0309-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -74620,33 +82854,37 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 2, + "output": 6, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } 
+ ] }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "mistral-small-2506", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ "text", @@ -74657,7 +82895,41 @@ ] }, "limit": { - "context": 400000, + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "cost": { + "input": 0.1, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, "output": 128000 }, "temperature": false, @@ -74673,10 +82945,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -74689,31 +82961,51 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "grok-code", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ 
"text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -74721,25 +83013,48 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-08-20", - "last_updated": "2025-08-20", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "mimo-v2-flash-free", - "name": "MiMo V2 Flash Free", - "display_name": "MiMo V2 Flash Free", + "id": "qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -74766,32 +83081,31 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.248, + "output": 1.485 }, "type": "chat" }, { - "id": "gpt-5.3-codex-spark", - "name": "GPT-5.3 Codex Spark", - "display_name": "GPT-5.3 Codex Spark", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -74805,9 +83119,8 @@ "supported": true, "default_enabled": true, "mode": "effort", - 
"effort": "medium", + "effort": "high", "effort_options": [ - "low", "medium", "high", "xhigh" @@ -74821,101 +83134,89 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "hy3-preview-free", - "name": "Hy3 preview Free", - "display_name": "Hy3 preview Free", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "mistral-large-latest", + "name": "Mistral Large (latest)", + "display_name": "Mistral Large (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - 
"continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ "text" @@ -74926,7 +83227,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -74935,69 +83236,120 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 2, + "output": 8 + }, + "type": "chat" + }, + { + "id": 
"gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "gemma-3-12b-it", + "name": "Gemma 3 12B", + "display_name": "Gemma 3 12B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -75007,29 +83359,29 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.45, - 
"output": 1.8 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", @@ -75040,8 +83392,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -75056,13 +83408,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -75072,81 +83417,91 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - 
"release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.2, - "output": 1.2, - "cache_read": 0.02, - "cache_write": 0.25 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "mimo-v2-pro-free", - "name": "MiMo V2 Pro Free", - "display_name": "MiMo V2 Pro Free", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -75155,30 +83510,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "nemotron-3-super-free", - "name": "Nemotron 3 Super Free", - "display_name": "Nemotron 3 Super Free", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -75188,8 +83553,8 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 262144, + "output": 65536 }, 
"temperature": true, "tool_call": true, @@ -75209,25 +83574,28 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.3, + "output": 7.8, + "cache_read": 0.13, + "cache_write": 1.625 }, "type": "chat" }, { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -75235,42 +83603,8 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 30, - "output": 180, - "cache_read": 30 - }, - "type": "chat" - }, - { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -75281,30 +83615,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + 
"attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.4, + "input": 0.3, "output": 2.5, - "cache_read": 0.4 + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -75322,16 +83666,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -75347,81 +83691,31 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "mimo-v2-omni-free", - "name": "MiMo V2 Omni Free", - "display_name": "MiMo V2 Omni Free", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image", - "audio", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 262144, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", - 
"cost": { - "input": 0, - "output": 0, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", - "modalities": { - "input": [ - "text", - "image", - "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -75436,13 +83730,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -75450,27 +83737,22 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", @@ -75482,23 +83764,22 @@ ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", "low", "medium", "high", @@ -75516,17 +83797,12 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 2.5, - 
"output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, @@ -75592,20 +83868,11 @@ "cache_write": 6.25 }, "type": "chat" - } - ] - }, - "stepfun": { - "id": "stepfun", - "name": "StepFun", - "display_name": "StepFun", - "api": "https://api.stepfun.com/v1", - "doc": "https://platform.stepfun.com/docs/zh/overview/concept", - "models": [ + }, { - "id": "step-3.5-flash-2603", - "name": "Step 3.5 Flash 2603", - "display_name": "Step 3.5 Flash 2603", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ "text" @@ -75615,31 +83882,29 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 0.45, + "output": 2.25 }, "type": "chat" }, { - "id": "step-1-32k", - "name": "Step 1 (32K)", - "display_name": "Step 1 (32K)", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -75649,31 +83914,29 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-01", - "last_updated": "2026-02-13", + "attachment": true, + "open_weights": true, + "knowledge": 
"2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2.05, - "output": 9.59, - "cache_read": 0.41 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next 80B-A3B Instruct", + "display_name": "Qwen3-Next 80B-A3B Instruct", "modalities": { "input": [ "text" @@ -75683,74 +83946,29 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-02-13", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.096, - "output": 0.288, - "cache_read": 0.019 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "step-2-16k", - "name": "Step 2 (16K)", - "display_name": "Step 2 (16K)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16384, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-01", - "last_updated": "2026-02-13", - "cost": { - "input": 5.21, - "output": 16.44, - "cache_read": 1.04 - }, - "type": "chat" - } - ] - }, - "nebius": { - "id": "nebius", - "name": "Nebius Token Factory", - "display_name": "Nebius Token Factory", - "api": "https://api.tokenfactory.nebius.com/v1", - "doc": "https://docs.tokenfactory.nebius.com/", - "models": [ - { - "id": "NousResearch/Hermes-4-70B", - "name": "Hermes-4-70B", - "display_name": "Hermes-4-70B", + "id": "minimax-m2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": 
"MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" @@ -75760,8 +83978,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -75771,33 +83989,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-30", - "last_updated": "2026-02-04", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.13, - "output": 0.4, - "reasoning": 0.4, - "cache_read": 0.013, - "cache_write": 0.16 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "NousResearch/Hermes-4-405B", - "name": "Hermes-4-405B", - "display_name": "Hermes-4-405B", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -75807,8 +84017,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -75829,33 +84039,35 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-30", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1, - "output": 3, - "reasoning": 3, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] 
}, "limit": { - "context": 128000, + "context": 1048576, "output": 8192 }, "temperature": true, @@ -75864,145 +84076,141 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2026-02-04", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025, - "cache_write": 0.31 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-15", - "last_updated": "2026-05-07", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.6, - "output": 3.6, - "cache_read": 0.06, - "cache_write": 0.75 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": 
"Qwen3-Embedding-8B", - "display_name": "Qwen3-Embedding-8B", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-10", - "last_updated": "2026-02-04", - "cost": { - "input": 0.01, - "output": 0 - }, - "type": "embedding" - }, - { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen3-30B-A3B-Instruct-2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - 
"context": 262144, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -76010,112 +84218,89 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-10-04", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 0.6 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 0.8, + "output": 3.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507-fast", - "name": "Qwen3-235B-A22B-Thinking-2507-fast", - "display_name": "Qwen3-235B-A22B-Thinking-2507-fast", + "id": "gemma-3-4b-it", + "name": "Gemma 3 4B", + "display_name": "Gemma 3 4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, + "context": 32768, "output": 8192 }, "temperature": true, - "tool_call": true, + 
"tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2026-05-07", + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B-fast", - "name": "Qwen3.5-397B-A17B-fast", - "display_name": "Qwen3.5-397B-A17B-fast", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ "text" @@ -76125,8 +84310,8 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -76146,22 +84331,21 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-15", - "last_updated": "2026-05-07", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0.6, - "output": 3.6, - "cache_read": 0.06, - "cache_write": 0.75 + "input": 0.4, + "output": 1.2, + "reasoning": 4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking-fast", - "name": "Qwen3-Next-80B-A3B-Thinking-fast", - "display_name": "Qwen3-Next-80B-A3B-Thinking-fast", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -76171,8 +84355,8 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -76193,68 +84377,69 @@ }, "attachment": false, "open_weights": true, - "knowledge": 
"2025-07", - "release_date": "2025-07-25", - "last_updated": "2026-05-07", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.15, - "output": 1.2, - "cache_read": 0.015, - "cache_write": 0.1875 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "grok-4-20-beta-0309-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.15, - "output": 1.2, - "reasoning": 1.2, - "cache_read": 0.015, - "cache_write": 0.18 + "input": 2, + "output": 6, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "PrimeIntellect/INTELLECT-3", - "name": "INTELLECT-3", - "display_name": "INTELLECT-3", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -76264,8 +84449,8 @@ ] }, "limit": { - "context": 128000, - 
"output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -76274,32 +84459,32 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-25", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.02, - "cache_write": 0.25 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -76318,60 +84503,60 @@ ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-03-01", - "last_updated": "2026-03-10", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.1, - "cache_write": 1 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-12-05", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + 
"release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.13, - "output": 0.4, - "cache_read": 0.013, - "cache_write": 0.16 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -76379,40 +84564,6 @@ }, "limit": { "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2024-07-23", - "last_updated": "2026-02-04", - "cost": { - "input": 0.02, - "output": 0.06, - "cache_read": 0.002, - "cache_write": 0.025 - }, - "type": "chat" - }, - { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron-3-Super-120B-A12B", - "display_name": "Nemotron-3-Super-120B-A12B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, "output": 32768 }, "temperature": true, @@ -76421,11 +84572,11 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-12", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { "input": 0.3, "output": 0.9 @@ -76433,242 +84584,56 @@ "type": "chat" }, { - "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", - "name": "Llama-3.1-Nemotron-Ultra-253B-v1", - "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": 
false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2026-02-04", - "cost": { - "input": 0.6, - "output": 1.8, - "cache_read": 0.06, - "cache_write": 0.75 - }, - "type": "chat" - }, - { - "id": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B", - "name": "Nemotron-3-Nano-30B-A3B", - "display_name": "Nemotron-3-Nano-30B-A3B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-08-10", - "last_updated": "2026-02-04", - "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.006, - "cache_write": 0.075 - }, - "type": "chat" - }, - { - "id": "nvidia/Nemotron-3-Nano-Omni", - "name": "Nemotron-3-Nano-Omni", - "display_name": "Nemotron-3-Nano-Omni", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 65536, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2026-05-07", - "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.006, - "cache_write": 0.075 - }, - "type": "chat" - }, - { - "id": "deepseek-ai/DeepSeek-V3.2-fast", - "name": "DeepSeek-V3.2-fast", - "display_name": "DeepSeek-V3.2-fast", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2026-05-07", - "cost": { - "input": 0.4, - "output": 2, - 
"cache_read": 0.04, - "cache_write": 0.5 - }, - "type": "chat" - }, - { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 163000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-20", - "last_updated": "2026-02-04", - "cost": { - "input": 0.3, - "output": 0.45, - "reasoning": 0.45, - "cache_read": 0.03, - "cache_write": 0.375 - }, - "type": "chat" - }, - { - "id": "openai/gpt-oss-120b-fast", - "name": "gpt-oss-120b-fast", - "display_name": "gpt-oss-120b-fast", + "id": "pixtral-large-latest", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, - "limit": { - "context": 8000, - "output": 8192 + "limit": { + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-06-10", - "last_updated": "2026-05-07", + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0.1, - "output": 0.5, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" 
], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -76677,335 +84642,264 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2026-01-10", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6, - "reasoning": 0.6, - "cache_read": 0.015, - "cache_write": 0.18 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "google/gemma-2-2b-it", - "name": "Gemma-2-2b-it", - "display_name": "Gemma-2-2b-it", + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-07-31", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.02, - "output": 0.06, - "cache_read": 0.002, - "cache_write": 0.025 + "input": 1.75, 
+ "output": 14, + "cache_read": 0.175 }, "type": "chat" - }, + } + ] + }, + "poe": { + "id": "poe", + "name": "Poe", + "display_name": "Poe", + "api": "https://api.poe.com/v1", + "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", + "models": [ { - "id": "google/gemma-3-27b-it", - "name": "Gemma-3-27b-it", - "display_name": "Gemma-3-27b-it", + "id": "ideogramai/ideogram-v2a-turbo", + "name": "Ideogram-v2a-Turbo", + "display_name": "Ideogram-v2a-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 110000, + "context": 150, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-20", - "last_updated": "2026-02-04", - "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 - }, + "open_weights": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5-fast", - "name": "Kimi-K2.5-fast", - "display_name": "Kimi-K2.5-fast", + "id": "ideogramai/ideogram-v2", + "name": "Ideogram-v2", + "display_name": "Ideogram-v2", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, + "context": 150, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-12-15", - "last_updated": "2026-02-04", - "cost": { - "input": 0.5, - "output": 2.5, - "cache_read": 0.05, - "cache_write": 0.625 - }, + 
"open_weights": false, + "release_date": "2024-08-21", + "last_updated": "2024-08-21", "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "ideogramai/ideogram", + "name": "Ideogram", + "display_name": "Ideogram", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, + "context": 150, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-12-15", - "last_updated": "2026-02-04", - "cost": { - "input": 0.5, - "output": 2.5, - "reasoning": 2.5, - "cache_read": 0.05, - "cache_write": 0.625 - }, + "open_weights": false, + "release_date": "2024-04-03", + "last_updated": "2024-04-03", "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "ideogramai/ideogram-v2a", + "name": "Ideogram-v2a", + "display_name": "Ideogram-v2a", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 196608, + "context": 150, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2026-05-07", - "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2025-02-27", + "last_updated": 
"2025-02-27", "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5-fast", - "name": "MiniMax-M2.5-fast", - "display_name": "MiniMax-M2.5-fast", + "id": "openai/chatgpt-4o-latest", + "name": "ChatGPT-4o-Latest", + "display_name": "ChatGPT-4o-Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, + "context": 128000, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2026-05-07", + "attachment": true, + "open_weights": false, + "release_date": "2024-08-14", + "last_updated": "2024-08-14", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 4.5, + "output": 14 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 128000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 1.75, - "output": 3.5, - "cache_read": 0.15 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "type": "chat" - } - ] - }, - "poe": { - "id": "poe", - 
"name": "Poe", - "display_name": "Poe", - "api": "https://api.poe.com/v1", - "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", - "models": [ + }, { - "id": "topazlabs-co/topazlabs", - "name": "TopazLabs", - "display_name": "TopazLabs", + "id": "openai/gpt-image-1-mini", + "name": "GPT-Image-1-Mini", + "display_name": "GPT-Image-1-Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "image" ] }, "limit": { - "context": 204, + "context": 8192, "output": 8192 }, "temperature": false, @@ -77015,112 +84909,116 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", - "type": "chat" + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "type": "imageGeneration" }, { - "id": "novita/kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 1.6, + "output": 13, + "cache_read": 0.16 
}, "type": "chat" }, { - "id": "novita/glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-Turbo", + "display_name": "GPT-3.5-Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 16384, + "output": 2048 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "cost": { + "input": 0.45, + "output": 1.4 + }, "type": "chat" }, { - "id": "novita/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -77129,68 +85027,71 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 18, + "output": 72 }, "type": "chat" }, { 
- "id": "novita/minimax-m2.1", - "name": "minimax-m2.1", - "display_name": "minimax-m2.1", + "id": "openai/gpt-5.3-instant", + "name": "GPT-5.3-Instant", + "display_name": "GPT-5.3-Instant", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-26", - "last_updated": "2025-12-26", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 1.6, + "output": 13, + "cache_read": 0.16 + }, "type": "chat" }, { - "id": "novita/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "openai/sora-2-pro", + "name": "Sora-2-Pro", + "display_name": "Sora-2-Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { @@ -77200,93 +85101,107 @@ "temperature": false, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "type": "chat" }, { - "id": "novita/kimi-k2.6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4-Nano", + "display_name": "GPT-5.4-Nano", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { 
"reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-05-02", + "open_weights": false, + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0.96, - "output": 4.04, - "cache_read": 0.16 + "input": 0.18, + "output": 1.1, + "cache_read": 0.018 }, "type": "chat" }, { - "id": "novita/glm-4.6v", - "name": "glm-4.6v", - "display_name": "glm-4.6v", + "id": "openai/gpt-image-2", + "name": "GPT-Image-2", + "display_name": "GPT-Image-2", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", - "type": "chat" + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 5.0505, + "output": 32.3232, + "cache_read": 1.2626 + }, + "type": "imageGeneration" }, { - "id": "novita/deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "openai/gpt-4o-mini-search", + "name": "GPT-4o-mini-Search", + "display_name": "GPT-4o-mini-Search", "modalities": { "input": [ "text" @@ -77299,32 +85214,25 @@ "context": 128000, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": 
true, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.13 + "input": 0.14, + "output": 0.54 }, "type": "chat" }, { - "id": "novita/glm-4.7-flash", - "name": "glm-4.7-flash", - "display_name": "glm-4.7-flash", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", "modalities": { "input": [ "text" @@ -77334,41 +85242,63 @@ ] }, "limit": { - "context": 200000, - "output": 65500 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 + }, "type": "chat" }, { - "id": "novita/glm-4.7-n", - "name": "glm-4.7-n", - "display_name": "glm-4.7-n", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2-Pro", + "display_name": "GPT-5.2-Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -77376,67 +85306,84 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + 
"high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 19, + "output": 150 + }, "type": "chat" }, { - "id": "novita/kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "openai/gpt-4-classic-0314", + "name": "GPT-4-Classic-0314", + "display_name": "GPT-4-Classic-0314", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 8192, + "output": 4096 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "release_date": "2024-08-26", + "last_updated": "2024-08-26", + "cost": { + "input": 27, + "output": 54 + }, "type": "chat" }, { - "id": "fireworks-ai/kimi-k2.5-fw", - "name": "Kimi-K2.5-FW", - "display_name": "Kimi-K2.5-FW", + "id": "openai/sora-2", + "name": "Sora-2", + "display_name": "Sora-2", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -77445,18 +85392,14 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "type": "chat" }, { - "id": "empiriolabs/deepseek-v4-pro-el", - 
"name": "DeepSeek-V4-Pro-EL", - "display_name": "DeepSeek-V4-Pro-EL", + "id": "openai/gpt-5.3-codex-spark", + "name": "GPT-5.3-Codex-Spark", + "display_name": "GPT-5.3-Codex-Spark", "modalities": { "input": [ "text" @@ -77466,92 +85409,143 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 128000, + "output": 16384 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-05-02", + "open_weights": false, + "release_date": "2026-03-04", + "last_updated": "2026-03-04", "cost": { - "input": 1.67, - "output": 3.33 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "empiriolabs/deepseek-v4-flash-el", - "name": "DeepSeek-V4-Flash-EL", - "display_name": "DeepSeek-V4-Flash-EL", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5-Turbo-Instruct", + "display_name": "GPT-3.5-Turbo-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 3500, + "output": 1024 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-05-02", + "open_weights": false, + "release_date": "2023-09-20", + "last_updated": "2023-09-20", "cost": { - "input": 0.14, - "output": 0.28 + "input": 1.4, + "output": 1.8 }, "type": "chat" }, { - "id": "elevenlabs/elevenlabs-v2.5-turbo", - "name": "ElevenLabs-v2.5-Turbo", - "display_name": 
"ElevenLabs-v2.5-Turbo", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-10-28", - "last_updated": "2024-10-28", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "cost": { + "input": 1.1, + "output": 9 + }, "type": "chat" }, { - "id": "elevenlabs/elevenlabs-v3", - "name": "ElevenLabs-v3", - "display_name": "ElevenLabs-v3", + "id": "openai/gpt-image-1.5", + "name": "gpt-image-1.5", + "display_name": "gpt-image-1.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "image" ] }, "limit": { @@ -77559,31 +85553,32 @@ "output": 8192 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", - "type": "chat" + "release_date": "2025-12-16", + "last_updated": "2025-12-16", + "type": "imageGeneration" }, { - "id": "elevenlabs/elevenlabs-music", - "name": "ElevenLabs-Music", - "display_name": "ElevenLabs-Music", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 2000, - "output": 8192 + "context": 1047576, + 
"output": 32768 }, "temperature": false, "tool_call": true, @@ -77592,25 +85587,31 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-29", - "last_updated": "2025-08-29", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + }, "type": "chat" }, { - "id": "cerebras/gpt-oss-120b-cs", - "name": "GPT-OSS-120B-CS", - "display_name": "GPT-OSS-120B-CS", + "id": "openai/gpt-5-pro", + "name": "GPT-5-Pro", + "display_name": "GPT-5-Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -77618,31 +85619,47 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.35, - "output": 0.75 + "input": 14, + "output": 110 }, "type": "chat" }, { - "id": "cerebras/llama-3.1-8b-cs", - "name": "Llama-3.1-8B-CS", - "display_name": "Llama-3.1-8B-CS", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": false, "tool_call": true, @@ -77651,167 +85668,251 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-13", - "last_updated": "2025-05-13", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.1, - "output": 0.1 + "input": 
0.36, + "output": 1.4, + "cache_read": 0.09 }, "type": "chat" }, { - "id": "cerebras/qwen3-32b-cs", - "name": "qwen3-32b-cs", - "display_name": "qwen3-32b-cs", + "id": "openai/gpt-3.5-turbo-raw", + "name": "GPT-3.5-Turbo-Raw", + "display_name": "GPT-3.5-Turbo-Raw", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 4524, + "output": 2048 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-15", - "last_updated": "2025-05-15", + "release_date": "2023-09-27", + "last_updated": "2023-09-27", + "cost": { + "input": 0.45, + "output": 1.4 + }, "type": "chat" }, { - "id": "cerebras/qwen3-235b-2507-cs", - "name": "qwen3-235b-2507-cs", - "display_name": "qwen3-235b-2507-cs", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + }, "type": "chat" }, { - "id": "cerebras/llama-3.3-70b-cs", - "name": "llama-3.3-70b-cs", - "display_name": "llama-3.3-70b-cs", + "id": "openai/gpt-5-nano", + "name": 
"GPT-5-nano", + "display_name": "GPT-5-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-13", - "last_updated": "2025-05-13", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.045, + "output": 0.36, + "cache_read": 0.0045 + }, "type": "chat" }, { - "id": "stabilityai/stablediffusionxl", - "name": "StableDiffusionXL", - "display_name": "StableDiffusionXL", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "image" ] }, "limit": { - "context": 200, - "output": 8192 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2023-07-09", - "last_updated": "2023-07-09", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", + "cost": { + "input": 2.2, + "output": 14, + "cache_read": 
0.22 + }, "type": "chat" }, { - "id": "xai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o-mini", + "display_name": "GPT-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 124096, + "output": 4096 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-22", - "last_updated": "2025-08-22", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.14, + "output": 0.54, + "cache_read": 0.068 }, "type": "chat" }, { - "id": "xai/grok-4-fast-reasoning", - "name": "Grok-4-Fast-Reasoning", - "display_name": "Grok-4-Fast-Reasoning", + "id": "openai/o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", "modalities": { "input": [ "text", @@ -77822,8 +85923,8 @@ ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -77833,24 +85934,32 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 140, + "output": 540 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-non-reasoning", - "name": "Grok-4.1-Fast-Non-Reasoning", - "display_name": "Grok-4.1-Fast-Non-Reasoning", + "id": 
"openai/gpt-4-turbo", + "name": "GPT-4-Turbo", + "display_name": "GPT-4-Turbo", "modalities": { "input": [ "text", @@ -77861,8 +85970,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 4096 }, "temperature": false, "tool_call": true, @@ -77871,86 +85980,101 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "cost": { + "input": 9, + "output": 27 + }, "type": "chat" }, { - "id": "xai/grok-4", - "name": "Grok-4", - "display_name": "Grok-4", + "id": "openai/dall-e-3", + "name": "DALL-E-3", + "display_name": "DALL-E-3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 800, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-07-10", - "last_updated": "2025-07-10", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "release_date": "2023-11-06", + "last_updated": "2023-11-06", + "type": "imageGeneration" }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4-Mini", + "display_name": "GPT-5.4-Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + 
"medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", + "release_date": "2026-03-12", + "last_updated": "2026-03-12", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 0.68, + "output": 4, + "cache_read": 0.068 }, "type": "chat" }, { - "id": "xai/grok-4.20-multi-agent", - "name": "Grok-4.20-Multi-Agent", - "display_name": "Grok-4.20-Multi-Agent", + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1-Instant", + "display_name": "GPT-5.1-Instant", "modalities": { "input": [ "text", @@ -77962,38 +86086,61 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "openai/gpt-4o-aug", + "name": "GPT-4o-Aug", + "display_name": "GPT-4o-Aug", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": false, @@ -78003,19 +86150,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-11", - 
"last_updated": "2025-04-11", + "release_date": "2024-11-21", + "last_updated": "2024-11-21", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 2.2, + "output": 9, + "cache_read": 1.1 }, "type": "chat" }, { - "id": "xai/grok-4-fast-non-reasoning", - "name": "Grok-4-Fast-Non-Reasoning", - "display_name": "Grok-4-Fast-Non-Reasoning", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", @@ -78026,29 +86173,43 @@ ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "release_date": "2024-12-18", + "last_updated": "2024-12-18", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 14, + "output": 54 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-reasoning", - "name": "Grok-4.1-Fast-Reasoning", - "display_name": "Grok-4.1-Fast-Reasoning", + "id": "openai/o3-mini-high", + "name": "o3-mini-high", + "display_name": "o3-mini-high", "modalities": { "input": [ "text", @@ -78059,8 +86220,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -78068,28 +86229,46 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-11-19", - 
"last_updated": "2025-11-19", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "cost": { + "input": 0.99, + "output": 4 + }, "type": "chat" }, { - "id": "runwayml/runway", - "name": "Runway", - "display_name": "Runway", + "id": "openai/gpt-4-classic", + "name": "GPT-4-Classic", + "display_name": "GPT-4-Classic", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, - "output": 8192 + "context": 8192, + "output": 4096 }, "temperature": false, "tool_call": true, @@ -78098,25 +86277,28 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", + "release_date": "2024-03-25", + "last_updated": "2024-03-25", + "cost": { + "input": 27, + "output": 54 + }, "type": "chat" }, { - "id": "runwayml/runway-gen-4-turbo", - "name": "Runway-Gen-4-Turbo", - "display_name": "Runway-Gen-4-Turbo", + "id": "openai/gpt-4o-search", + "name": "GPT-4o-Search", + "display_name": "GPT-4o-Search", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, + "context": 128000, "output": 8192 }, "temperature": false, @@ -78126,8 +86308,12 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-09", - "last_updated": "2025-05-09", + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "cost": { + "input": 2.2, + "output": 9 + }, "type": "chat" }, { @@ -78186,37 +86372,109 @@ "type": "chat" }, { - "id": "openai/sora-2-pro", - "name": "Sora-2-Pro", - "display_name": "Sora-2-Pro", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4-Pro", + "display_name": "GPT-5.4-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 27, + "output": 160 + }, "type": "chat" }, { - "id": "openai/chatgpt-4o-latest", - "name": "ChatGPT-4o-Latest", - "display_name": "ChatGPT-4o-Latest", + "id": "openai/o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ "text", @@ -78227,8 +86485,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": false, "tool_call": true, @@ -78237,18 +86495,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-08-14", - "last_updated": "2024-08-14", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 4.5, - "output": 14 + "input": 0.09, + "output": 
0.36, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5-Chat", - "display_name": "GPT-5-Chat", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", @@ -78259,29 +86518,44 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0.99, + "output": 4, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT-5.2-Pro", - "display_name": "GPT-5.2-Pro", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ "text", @@ -78299,18 +86573,19 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "high", + "effort": "none", "effort_options": [ + "none", + "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -78323,18 +86598,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 19, - "output": 150 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": 
"openai/gpt-4o-aug", - "name": "GPT-4o-Aug", - "display_name": "GPT-4o-Aug", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ "text", @@ -78345,74 +86621,96 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-11-21", - "last_updated": "2024-11-21", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 2.2, - "output": 9, - "cache_read": 1.1 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-image-2", - "name": "GPT-Image-2", - "display_name": "GPT-Image-2", + "id": "openai/gpt-5-chat", + "name": "GPT-5-Chat", + "display_name": "GPT-5-Chat", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 5.0505, - "output": 32.3232, - "cache_read": 1.2626 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4-classic-0314", - "name": "GPT-4-Classic-0314", - "display_name": "GPT-4-Classic-0314", + "id": 
"openai/gpt-image-1", + "name": "GPT-Image-1", + "display_name": "GPT-Image-1", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -78421,13 +86719,9 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-08-26", - "last_updated": "2024-08-26", - "cost": { - "input": 27, - "output": 54 - }, - "type": "chat" + "release_date": "2025-03-31", + "last_updated": "2025-03-31", + "type": "imageGeneration" }, { "id": "openai/gpt-5-mini", @@ -78485,9 +86779,9 @@ "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5-nano", - "display_name": "GPT-5-nano", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text", @@ -78498,8 +86792,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -78514,13 +86808,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -78530,12 +86817,11 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.045, - "output": 0.36, - "cache_read": 0.0045 + "input": 0.99, + "output": 4 }, "type": "chat" }, @@ -78595,9 +86881,9 @@ "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4-Turbo", - "display_name": "GPT-4-Turbo", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -78608,62 +86894,69 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + 
"default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2023-09-13", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 9, - "output": 27 + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -78673,19 +86966,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 9, + "output": 36, + "cache_read": 2.2 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "openai/gpt-5.2-instant", + "name": "GPT-5.2-Instant", + "display_name": "GPT-5.2-Instant", "modalities": { "input": [ "text", @@ -78696,22 +86989,30 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 16384 }, 
"temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -78721,18 +87022,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 18, - "output": 72 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "o3-mini-high", - "display_name": "o3-mini-high", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -78743,8 +87045,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -78759,6 +87061,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -78768,30 +87077,57 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.99, - "output": 4 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o-mini", - "display_name": "GPT-4o-mini", + "id": "cerebras/llama-3.3-70b-cs", + "name": "llama-3.3-70b-cs", + "display_name": "llama-3.3-70b-cs", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 124096, - "output": 4096 + "context": 8192, + "output": 8192 + 
}, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-13", + "last_updated": "2025-05-13", + "type": "chat" + }, + { + "id": "cerebras/llama-3.1-8b-cs", + "name": "Llama-3.1-8B-CS", + "display_name": "Llama-3.1-8B-CS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -78800,19 +87136,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-05-13", + "last_updated": "2025-05-13", "cost": { - "input": 0.14, - "output": 0.54, - "cache_read": 0.068 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "cerebras/gpt-oss-120b-cs", + "name": "GPT-OSS-120B-CS", + "display_name": "GPT-OSS-120B-CS", "modalities": { "input": [ "text" @@ -78822,8 +87157,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -78831,222 +87166,132 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 + "input": 0.35, + "output": 0.75 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "GPT-5.4-Mini", - "display_name": "GPT-5.4-Mini", + "id": "cerebras/qwen3-235b-2507-cs", + "name": "qwen3-235b-2507-cs", + 
"display_name": "qwen3-235b-2507-cs", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-03-12", - "cost": { - "input": 0.68, - "output": 4, - "cache_read": 0.068 - }, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "openai/dall-e-3", - "name": "DALL-E-3", - "display_name": "DALL-E-3", + "id": "cerebras/qwen3-32b-cs", + "name": "qwen3-32b-cs", + "display_name": "qwen3-32b-cs", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 800, + "context": 8192, "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2023-11-06", - "type": "imageGeneration" + "release_date": "2025-05-15", + "last_updated": "2025-05-15", + "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "runwayml/runway-gen-4-turbo", + "name": "Runway-Gen-4-Turbo", + "display_name": "Runway-Gen-4-Turbo", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": 
true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", - "cost": { - "input": 0.99, - "output": 4, - "cache_read": 0.25 - }, + "release_date": "2025-05-09", + "last_updated": "2025-05-09", "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT-5.4-Nano", - "display_name": "GPT-5.4-Nano", + "id": "runwayml/runway", + "name": "Runway", + "display_name": "Runway", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-11", - "cost": { - "input": 0.18, - "output": 1.1, - "cache_read": 0.018 - }, + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "type": "chat" }, { - "id": "openai/gpt-image-1", - "name": "GPT-Image-1", - "display_name": "GPT-Image-1", + "id": "stabilityai/stablediffusionxl", + "name": "StableDiffusionXL", + "display_name": "StableDiffusionXL", "modalities": { "input": [ "text", @@ -79057,7 +87302,7 @@ ] }, "limit": { - "context": 128000, + "context": 200, "output": 8192 }, "temperature": false, @@ -79067,69 +87312,45 @@ }, "attachment": true, 
"open_weights": false, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", - "type": "imageGeneration" + "release_date": "2023-07-09", + "last_updated": "2023-07-09", + "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "empiriolabs/deepseek-v4-flash-el", + "name": "DeepSeek-V4-Flash-EL", + "display_name": "DeepSeek-V4-Flash-EL", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 384000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, - "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-05-02", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 0.14, + "output": 0.28 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "display_name": "GPT-5.1-Codex-Mini", + "id": "empiriolabs/deepseek-v4-pro-el", + "name": "DeepSeek-V4-Pro-EL", + "display_name": "DeepSeek-V4-Pro-EL", "modalities": { "input": [ "text" @@ -79139,62 +87360,40 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 384000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - 
"high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-05-02", "cost": { - "input": 0.22, - "output": 1.8, - "cache_read": 0.022 + "input": 1.67, + "output": 3.33 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude-Sonnet-4.6", + "display_name": "Claude-Sonnet-4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 983040, "output": 128000 }, "temperature": false, @@ -79207,125 +87406,190 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", "effort_options": [ - "none", "low", "medium", "high" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "openai/gpt-image-1-mini", - "name": "GPT-Image-1-Mini", - "display_name": "GPT-Image-1-Mini", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude-Sonnet-4.5", + "display_name": "Claude-Sonnet-4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 983040, + "output": 32768 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", - "type": "imageGeneration" + "release_date": "2025-09-26", + "last_updated": "2025-09-26", + "cost": { + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 + }, + "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "anthropic/claude-opus-4.6", + "name": "Claude-Opus-4.6", + "display_name": "Claude-Opus-4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 983040, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, "effort": "medium", "effort_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2024-12-18", - "last_updated": "2024-12-18", + "release_date": "2026-02-04", + "last_updated": "2026-02-04", "cost": { - "input": 14, - "output": 54 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT-5.4-Pro", - "display_name": "GPT-5.4-Pro", + "id": "anthropic/claude-haiku-3", + "name": "Claude-Haiku-3", + "display_name": "Claude-Haiku-3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 189096, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-03-09", + "last_updated": "2024-03-09", + "cost": { + "input": 0.21, + "output": 1.1, + "cache_read": 0.021, + "cache_write": 0.26 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4.1", + "name": "Claude-Opus-4.1", + "display_name": "Claude-Opus-4.1", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 32000 }, "temperature": false, "tool_call": true, @@ -79333,52 +87597,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + 
"release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 27, - "output": 160 + "input": 13, + "output": 64, + "cache_read": 1.3, + "cache_write": 16 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-Turbo", - "display_name": "GPT-3.5-Turbo", + "id": "anthropic/claude-sonnet-3.5-june", + "name": "Claude-Sonnet-3.5-June", + "display_name": "Claude-Sonnet-3.5-June", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 2048 + "context": 189096, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -79387,29 +87634,33 @@ }, "attachment": true, "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2023-09-13", + "release_date": "2024-11-18", + "last_updated": "2024-11-18", "cost": { - "input": 0.45, - "output": 1.4 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "anthropic/claude-opus-4", + "name": "Claude-Opus-4", + "display_name": "Claude-Opus-4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 192512, + "output": 28672 }, "temperature": false, "tool_call": true, @@ -79417,47 +87668,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "cost": { - "input": 9, - "output": 36, - "cache_read": 2.2 + "input": 13, + "output": 64, + "cache_read": 1.3, + "cache_write": 16 }, 
"type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude-Haiku-4.5", + "display_name": "Claude-Haiku-4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 192000, + "output": 64000 }, "temperature": false, "tool_call": true, @@ -79465,46 +87704,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.99, - "output": 4 + "input": 0.85, + "output": 4.3, + "cache_read": 0.085, + "cache_write": 1.1 }, "type": "chat" }, { - "id": "openai/o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "anthropic/claude-sonnet-3.7", + "name": "Claude-Sonnet-3.7", + "display_name": "Claude-Sonnet-3.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 196608, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -79512,44 +87740,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 140, - "output": 540 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + 
"cache_write": 3.2 }, "type": "chat" }, { - "id": "openai/gpt-4o-search", - "name": "GPT-4o-Search", - "display_name": "GPT-4o-Search", + "id": "anthropic/claude-haiku-3.5", + "name": "Claude-Haiku-3.5", + "display_name": "Claude-Haiku-3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 189096, "output": 8192 }, "temperature": false, @@ -79559,30 +87777,33 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 2.2, - "output": 9 + "input": 0.68, + "output": 3.4, + "cache_read": 0.068, + "cache_write": 0.85 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "anthropic/claude-opus-4.5", + "name": "Claude-Opus-4.5", + "display_name": "Claude-Opus-4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 196608, + "output": 64000 }, "temperature": false, "tool_call": true, @@ -79590,41 +87811,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-11-21", + "last_updated": "2025-11-21", "cost": { - "input": 1.1, - "output": 9 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "anthropic/claude-sonnet-4", + 
"name": "Claude-Sonnet-4", + "display_name": "Claude-Sonnet-4", "modalities": { "input": [ "text", @@ -79632,121 +87834,108 @@ "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 983040, + "output": 64000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "cost": { - "input": 2.2, - "output": 14, - "cache_read": 0.22 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex-spark", - "name": "GPT-5.3-Codex-Spark", - "display_name": "GPT-5.3-Codex-Spark", + "id": "anthropic/claude-opus-4.7", + "name": "Claude-Opus-4.7", + "display_name": "Claude-Opus-4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ "low", "medium", "high", "xhigh" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + 
"Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-04", - "last_updated": "2026-03-04", + "release_date": "2026-04-15", + "last_updated": "2026-04-15", "cost": { - "input": 0, - "output": 0 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.4 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-raw", - "name": "GPT-3.5-Turbo-Raw", - "display_name": "GPT-3.5-Turbo-Raw", + "id": "anthropic/claude-sonnet-3.5", + "name": "Claude-Sonnet-3.5", + "display_name": "Claude-Sonnet-3.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4524, - "output": 2048 + "context": 189096, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -79755,30 +87944,31 @@ }, "attachment": true, "open_weights": false, - "release_date": "2023-09-27", - "last_updated": "2023-09-27", + "release_date": "2024-06-05", + "last_updated": "2024-06-05", "cost": { - "input": 0.45, - "output": 1.4 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", + "id": "elevenlabs/elevenlabs-v3", + "name": "ElevenLabs-v3", + "display_name": "ElevenLabs-v3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -79787,147 +87977,106 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", - "cost": { - "input": 0.09, - "output": 0.36, - "cache_read": 0.022 - }, + "release_date": 
"2025-06-05", + "last_updated": "2025-06-05", "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "elevenlabs/elevenlabs-music", + "name": "ElevenLabs-Music", + "display_name": "ElevenLabs-Music", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 2000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", - "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 - }, + "release_date": "2025-08-29", + "last_updated": "2025-08-29", "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5-Pro", - "display_name": "GPT-5-Pro", + "id": "elevenlabs/elevenlabs-v2.5-turbo", + "name": "ElevenLabs-v2.5-Turbo", + "display_name": "ElevenLabs-v2.5-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", - "cost": { - "input": 14, - "output": 110 - }, + "release_date": "2024-10-28", + "last_updated": 
"2024-10-28", "type": "chat" }, { - "id": "openai/sora-2", - "name": "Sora-2", - "display_name": "Sora-2", + "id": "novita/minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 205000, + "output": 131072 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-12-26", + "last_updated": "2025-12-26", "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "novita/kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -79935,37 +88084,53 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0.6, + "output": 3, + "cache_read": 0.1 + }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "novita/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + 
"context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -79973,96 +88138,52 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0.27, + "output": 0.4, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-5.2-instant", - "name": "GPT-5.2-Instant", - "display_name": "GPT-5.2-Instant", + "id": "novita/glm-4.7-n", + "name": "glm-4.7-n", + "display_name": "glm-4.7-n", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 205000, + "output": 131072 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 - }, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "type": "chat" }, { - "id": "openai/gpt-4o-mini-search", - "name": "GPT-4o-mini-Search", - "display_name": 
"GPT-4o-mini-Search", + "id": "novita/glm-4.7-flash", + "name": "glm-4.7-flash", + "display_name": "glm-4.7-flash", "modalities": { "input": [ "text" @@ -80072,209 +88193,225 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 65500 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", - "cost": { - "input": 0.14, - "output": 0.54 - }, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "openai/gpt-image-1.5", - "name": "gpt-image-1.5", - "display_name": "gpt-image-1.5", + "id": "novita/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "type": "imageGeneration" + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "GPT-3.5-Turbo-Instruct", - "display_name": "GPT-3.5-Turbo-Instruct", + "id": "novita/kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 3500, - "output": 1024 + "context": 256000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { 
+ "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2023-09-20", - "last_updated": "2023-09-20", - "cost": { - "input": 1.4, - "output": 1.8 - }, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "novita/glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 205000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 - }, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "type": "chat" }, { - "id": "openai/gpt-5.1-instant", - "name": "GPT-5.1-Instant", - "display_name": "GPT-5.1-Instant", + "id": "novita/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 205000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - 
], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "novita/kimi-k2.6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-20", + "last_updated": "2026-05-02", "cost": { - "input": 0.36, - "output": 1.4, - "cache_read": 0.09 + "input": 0.96, + "output": 4.04, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-4-classic", - "name": "GPT-4-Classic", - "display_name": "GPT-4-Classic", + "id": "novita/glm-4.6v", + "name": "glm-4.6v", + "display_name": "glm-4.6v", "modalities": { "input": [ "text", @@ -80285,95 +88422,64 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 131000, + "output": 32768 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": 
"2024-03-25", - "last_updated": "2024-03-25", - "cost": { - "input": 27, - "output": 54 - }, + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "google/veo-3.1-fast", + "name": "Veo-3.1-Fast", + "display_name": "Veo-3.1-Fast", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", - "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 - }, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "type": "chat" }, { - "id": "openai/gpt-5.3-instant", - "name": "GPT-5.3-Instant", - "display_name": "GPT-5.3-Instant", + "id": "google/imagen-4-fast", + "name": "Imagen-4-Fast", + "display_name": "Imagen-4-Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -80382,13 +88488,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", - "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 - }, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", "type": "chat" }, { @@ -80419,20 +88520,20 @@ "type": "chat" }, { - "id": 
"google/veo-3.1-fast", - "name": "Veo-3.1-Fast", - "display_name": "Veo-3.1-Fast", + "id": "google/nano-banana-pro", + "name": "Nano-Banana-Pro", + "display_name": "Nano-Banana-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "image" ] }, "limit": { - "context": 480, + "context": 65536, "output": 8192 }, "temperature": false, @@ -80442,14 +88543,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "google/gemini-3.1-pro", - "name": "Gemini-3.1-Pro", - "display_name": "Gemini-3.1-Pro", + "id": "google/gemini-3-pro", + "name": "Gemini-3-Pro", + "display_name": "Gemini-3-Pro", "modalities": { "input": [ "text", @@ -80490,46 +88596,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-10-22", + "last_updated": "2025-10-22", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 - }, - "type": "chat" - }, - { - "id": "google/imagen-3-fast", - "name": "Imagen-3-Fast", - "display_name": "Imagen-3-Fast", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 480, - "output": 8192 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false + "input": 1.6, + "output": 9.6, + "cache_read": 0.16 }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-17", - "last_updated": "2024-10-17", "type": "chat" }, { - "id": "google/gemini-2.0-flash", - "name": "Gemini-2.0-Flash", - "display_name": "Gemini-2.0-Flash", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini-3.1-Flash-Lite", + "display_name": "Gemini-3.1-Flash-Lite", "modalities": { "input": [ "text", @@ -80542,55 +88621,61 @@ ] }, "limit": { - "context": 990000, - "output": 8192 + 
"context": 1048576, + "output": 65536 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2026-02-18", + "last_updated": "2026-02-18", "cost": { - "input": 0.1, - "output": 0.42 + "input": 0.25, + "output": 1.5 }, "type": "chat" }, { - "id": "google/gemini-deep-research", - "name": "gemini-deep-research", - "display_name": "gemini-deep-research", + "id": "google/nano-banana", + "name": "Nano-Banana", + "display_name": "Nano-Banana", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1048576, + "context": 65536, "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 1.6, - "output": 9.6 + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 }, "type": "chat" }, @@ -80650,15 +88735,15 @@ "type": "chat" }, { - "id": "google/imagen-3", - "name": "Imagen-3", - "display_name": "Imagen-3", + "id": "google/veo-3.1", + "name": "Veo-3.1", + "display_name": "Veo-3.1", "modalities": { "input": [ "text" ], "output": [ - "image" + "video" ] }, "limit": { @@ -80672,26 +88757,24 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-10-15", - "last_updated": "2024-10-15", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "type": "chat" }, { - "id": "google/nano-banana", - "name": "Nano-Banana", - "display_name": "Nano-Banana", + "id": "google/imagen-3", + "name": "Imagen-3", + "display_name": "Imagen-3", "modalities": { "input": [ 
- "text", - "image" + "text" ], "output": [ - "text", "image" ] }, "limit": { - "context": 65536, + "context": 480, "output": 8192 }, "temperature": false, @@ -80701,19 +88784,14 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", - "cost": { - "input": 0.21, - "output": 1.8, - "cache_read": 0.021 - }, + "release_date": "2024-10-15", + "last_updated": "2024-10-15", "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini-2.5-Flash", - "display_name": "Gemini-2.5-Flash", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini-2.5-Flash-Lite", + "display_name": "Gemini-2.5-Flash-Lite", "modalities": { "input": [ "text", @@ -80726,26 +88804,25 @@ ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 1024000, + "output": 64000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "budget", "budget": { "default": -1, - "min": 0, + "min": 512, "max": 24576, "auto": -1, - "off": 0, "unit": "tokens" }, "summaries": true, @@ -80757,19 +88834,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-26", - "last_updated": "2025-04-26", + "release_date": "2025-06-19", + "last_updated": "2025-06-19", "cost": { - "input": 0.21, - "output": 1.8, - "cache_read": 0.021 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Gemini-3.1-Flash-Lite", - "display_name": "Gemini-3.1-Flash-Lite", + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini-2.0-Flash-Lite", + "display_name": "Gemini-2.0-Flash-Lite", "modalities": { "input": [ "text", @@ -80782,28 +88858,49 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 990000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, 
- "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-18", - "last_updated": "2026-02-18", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 0.25, - "output": 1.5 + "input": 0.052, + "output": 0.21 + }, + "type": "chat" + }, + { + "id": "google/veo-3", + "name": "Veo-3", + "display_name": "Veo-3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "limit": { + "context": 480, + "output": 8192 }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "type": "chat" }, { @@ -80862,9 +88959,99 @@ "type": "chat" }, { - "id": "google/veo-3.1", - "name": "Veo-3.1", - "display_name": "Veo-3.1", + "id": "google/gemini-deep-research", + "name": "gemini-deep-research", + "display_name": "gemini-deep-research", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.6, + "output": 9.6 + }, + "type": "chat" + }, + { + "id": "google/gemini-2.5-flash", + "name": "Gemini-2.5-Flash", + "display_name": "Gemini-2.5-Flash", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1065535, + "output": 65535 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + 
"default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-26", + "last_updated": "2025-04-26", + "cost": { + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 + }, + "type": "chat" + }, + { + "id": "google/veo-2", + "name": "Veo-2", + "display_name": "Veo-2", "modalities": { "input": [ "text" @@ -80884,8 +89071,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2024-12-02", + "last_updated": "2024-12-02", "type": "chat" }, { @@ -80943,20 +89130,54 @@ "type": "chat" }, { - "id": "google/nano-banana-pro", - "name": "Nano-Banana-Pro", - "display_name": "Nano-Banana-Pro", + "id": "google/gemini-2.0-flash", + "name": "Gemini-2.0-Flash", + "display_name": "Gemini-2.0-Flash", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ + "text" + ] + }, + "limit": { + "context": 990000, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.1, + "output": 0.42 + }, + "type": "chat" + }, + { + "id": "google/gemma-4-31b", + "name": "Gemma-4-31B", + "display_name": "Gemma-4-31B", + "modalities": { + "input": [ + "text", "image" + ], + "output": [ + "text" ] }, "limit": { - "context": 65536, + "context": 262144, "output": 8192 }, "temperature": false, @@ -80966,19 +89187,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": 
"google/gemini-3-pro", - "name": "Gemini-3-Pro", - "display_name": "Gemini-3-Pro", + "id": "google/gemini-3.1-pro", + "name": "Gemini-3.1-Pro", + "display_name": "Gemini-3.1-Pro", "modalities": { "input": [ "text", @@ -81019,19 +89239,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 1.6, - "output": 9.6, - "cache_read": 0.16 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "google/imagen-4-fast", - "name": "Imagen-4-Fast", - "display_name": "Imagen-4-Fast", + "id": "google/imagen-3-fast", + "name": "Imagen-3-Fast", + "display_name": "Imagen-3-Fast", "modalities": { "input": [ "text" @@ -81051,20 +89271,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", + "release_date": "2024-10-17", + "last_updated": "2024-10-17", "type": "chat" }, { - "id": "google/veo-3", - "name": "Veo-3", - "display_name": "Veo-3", + "id": "google/imagen-4", + "name": "Imagen-4", + "display_name": "Imagen-4", "modalities": { "input": [ "text" ], "output": [ - "video" + "image" ] }, "limit": { @@ -81078,95 +89298,240 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini-2.5-Flash-Lite", - "display_name": "Gemini-2.5-Flash-Lite", + "id": "trytako/tako", + "name": "Tako", + "display_name": "Tako", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2048, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "type": "chat" + }, + { + "id": 
"poetools/claude-code", + "name": "claude-code", + "display_name": "claude-code", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-27", + "last_updated": "2025-11-27", + "type": "chat" + }, + { + "id": "fireworks-ai/kimi-k2.5-fw", + "name": "Kimi-K2.5-FW", + "display_name": "Kimi-K2.5-FW", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1024000, - "output": 64000 + "context": 262144, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + }, + "type": "chat" + }, + { + "id": "xai/grok-4", + "name": "Grok-4", + "display_name": "Grok-4", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - 
"budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-19", - "last_updated": "2025-06-19", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.07, - "output": 0.28 + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "google/imagen-4", - "name": "Imagen-4", - "display_name": "Imagen-4", + "id": "xai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" ], "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-22", + "last_updated": "2025-08-22", + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + }, + "type": "chat" + }, + { + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok-4.1-Fast-Reasoning", + "display_name": "Grok-4.1-Fast-Reasoning", + "modalities": { + "input": [ + "text", "image" + ], + "output": [ + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": "google/gemma-4-31b", - "name": "Gemma-4-31B", - "display_name": "Gemma-4-31B", + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok-4.1-Fast-Non-Reasoning", + "display_name": 
"Grok-4.1-Fast-Non-Reasoning", "modalities": { "input": [ "text", @@ -81177,8 +89542,8 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": false, "tool_call": true, @@ -81187,31 +89552,25 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini-2.0-Flash-Lite", - "display_name": "Gemini-2.0-Flash-Lite", + "id": "xai/grok-4.20-multi-agent", + "name": "Grok-4.20-Multi-Agent", + "display_name": "Grok-4.20-Multi-Agent", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 990000, + "context": 128000, "output": 8192 }, "temperature": false, @@ -81221,28 +89580,29 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "cost": { - "input": 0.052, - "output": 0.21 + "input": 2, + "output": 6, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "google/veo-2", - "name": "Veo-2", - "display_name": "Veo-2", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, + "context": 131072, "output": 8192 }, "temperature": false, @@ -81252,26 +89612,31 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-12-02", - "last_updated": "2024-12-02", + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.75 + }, "type": "chat" }, { - "id": "lumalabs/ray2", - "name": "Ray2", - "display_name": "Ray2", + "id": "xai/grok-4-fast-non-reasoning", + "name": "Grok-4-Fast-Non-Reasoning", + "display_name": 
"Grok-4-Fast-Non-Reasoning", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 5000, - "output": 8192 + "context": 2000000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -81280,27 +89645,31 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude-Opus-4.1", - "display_name": "Claude-Opus-4.1", + "id": "xai/grok-4-fast-reasoning", + "name": "Grok-4-Fast-Reasoning", + "display_name": "Grok-4-Fast-Reasoning", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 32000 + "context": 2000000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -81308,34 +89677,64 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "lumalabs/ray2", + "name": "Ray2", + "display_name": "Ray2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "limit": { + "context": 5000, + "output": 8192 }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.5", - "name": "Claude-Sonnet-3.5", - "display_name": "Claude-Sonnet-3.5", + "id": 
"topazlabs-co/topazlabs", + "name": "TopazLabs", + "display_name": "TopazLabs", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 189096, + "context": 204, "output": 8192 }, "temperature": false, @@ -81345,290 +89744,328 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", - "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "type": "chat" }, { - "id": "anthropic/claude-haiku-3", - "name": "Claude-Haiku-3", - "display_name": "Claude-Haiku-3", + "id": "openai/gpt-5.5-pro", + "name": "GPT-5.5-Pro", + "display_name": "GPT-5.5-Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2024-03-09", - "last_updated": "2024-03-09", + "knowledge": "2025-12-01", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.21, - "output": 1.1, - "cache_read": 0.021, - "cache_write": 0.26 + "input": 27.2727, + "output": 163.6364 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude-Opus-4.6", - "display_name": "Claude-Opus-4.6", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 983040, + "context": 400000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": 
true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "default_enabled": true, + "mode": "effort", "effort": "medium", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "knowledge": "2025-12-01", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.3 + "input": 4.5455, + "output": 27.2727, + "cache_read": 0.4545 + }, + "type": "chat" + } + ] + }, + "minimax": { + "id": "minimax", + "name": "MiniMax (minimax.io)", + "display_name": "MiniMax (minimax.io)", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/guides/quickstart", + "models": [ + { + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude-Opus-4.7", - "display_name": "Claude-Opus-4.7", + "id": "MiniMax-M2.7", + 
"name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-15", - "last_updated": "2026-04-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.4 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude-Sonnet-4", - "display_name": "Claude-Sonnet-4", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 64000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "extra_capabilities": { + 
"reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude-Sonnet-4.5", - "display_name": "Claude-Sonnet-4.5", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 32768 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude-Opus-4.5", - "display_name": "Claude-Opus-4.5", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 64000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - 
"attachment": true, - "open_weights": false, - "release_date": "2025-11-21", - "last_updated": "2025-11-21", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.3 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.7", - "name": "Claude-Sonnet-3.7", - "display_name": "Claude-Sonnet-3.7", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -81638,342 +90075,334 @@ "context": 196608, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.3, + "output": 1.2 }, "type": "chat" - }, + } + ] + }, + "groq": { + "id": "groq", + "name": "Groq", + "display_name": "Groq", + "doc": "https://console.groq.com/docs/models", + "models": [ { - "id": "anthropic/claude-opus-4", - "name": "Claude-Opus-4", - "display_name": "Claude-Opus-4", + "id": "gemma2-9b-it", + "name": "Gemma 2 9B", + "display_name": "Gemma 2 9B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 192512, - "output": 28672 + "context": 8192, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true 
+ "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-3.5", - "name": "Claude-Haiku-3.5", - "display_name": "Claude-Haiku-3.5", + "id": "llama-3.1-8b-instant", + "name": "Llama 3.1 8B Instant", + "display_name": "Llama 3.1 8B Instant", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.68, - "output": 3.4, - "cache_read": 0.068, - "cache_write": 0.85 + "input": 0.05, + "output": 0.08 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude-Haiku-4.5", - "display_name": "Claude-Haiku-4.5", + "id": "llama3-8b-8192", + "name": "Llama 3 8B", + "display_name": "Llama 3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 192000, - "output": 64000 + "context": 8192, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": 
"2023-03", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.85, - "output": 4.3, - "cache_read": 0.085, - "cache_write": 1.1 + "input": 0.05, + "output": 0.08 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.5-june", - "name": "Claude-Sonnet-3.5-June", - "display_name": "Claude-Sonnet-3.5-June", + "id": "allam-2-7b", + "name": "ALLaM-2-7b", + "display_name": "ALLaM-2-7b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 4096, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-11-18", - "last_updated": "2024-11-18", + "knowledge": "2024-09", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude-Sonnet-4.6", - "display_name": "Claude-Sonnet-4.6", + "id": "mistral-saba-24b", + "name": "Mistral Saba 24B", + "display_name": "Mistral Saba 24B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 128000 + "context": 32768, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends 
adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-08", + "release_date": "2025-02-06", + "last_updated": "2025-02-06", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.79, + "output": 0.79 }, "type": "chat" }, { - "id": "ideogramai/ideogram", - "name": "Ideogram", - "display_name": "Ideogram", + "id": "qwen-qwq-32b", + "name": "Qwen QwQ 32B", + "display_name": "Qwen QwQ 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-11-27", + "last_updated": "2024-11-27", + "cost": { + "input": 0.29, + "output": 0.39 }, - "attachment": true, - "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2024-04-03", "type": "chat" }, { - "id": "ideogramai/ideogram-v2", - "name": "Ideogram-v2", - "display_name": "Ideogram-v2", + "id": "llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "display_name": "Llama 3.3 70B Versatile", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-21", - "last_updated": "2024-08-21", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + 
"release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.59, + "output": 0.79 + }, "type": "chat" }, { - "id": "ideogramai/ideogram-v2a-turbo", - "name": "Ideogram-v2a-Turbo", - "display_name": "Ideogram-v2a-Turbo", + "id": "whisper-large-v3", + "name": "Whisper Large V3", + "display_name": "Whisper Large V3", "modalities": { "input": [ - "text" + "audio" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 448, + "output": 448 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "attachment": false, + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "ideogramai/ideogram-v2a", - "name": "Ideogram-v2a", - "display_name": "Ideogram-v2a", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, + "context": 131072, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 0.75, + "output": 0.99 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", "type": "chat" }, { - "id": "trytako/tako", - "name": "Tako", - "display_name": "Tako", + "id": "llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "display_name": 
"Llama Guard 3 8B", "modalities": { "input": [ "text" @@ -81983,24 +90412,28 @@ ] }, "limit": { - "context": 2048, + "context": 8192, "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.2, + "output": 0.2 + }, "type": "chat" }, { - "id": "poetools/claude-code", - "name": "claude-code", - "display_name": "claude-code", + "id": "llama3-70b-8192", + "name": "Llama 3 70B", + "display_name": "Llama 3 70B", "modalities": { "input": [ "text" @@ -82013,168 +90446,133 @@ "context": 8192, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-03", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "cost": { + "input": 0.59, + "output": 0.79 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-27", - "last_updated": "2025-11-27", "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "whisper-large-v3-turbo", + "name": "Whisper Large v3 Turbo", + "display_name": "Whisper Large v3 Turbo", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 448, + "output": 448 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - 
"low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 4.5455, - "output": 27.2727, - "cache_read": 0.4545 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "GPT-5.5-Pro", - "display_name": "GPT-5.5-Pro", + "id": "moonshotai/kimi-k2-instruct-0905", + "name": "Kimi K2 Instruct 0905", + "display_name": "Kimi K2 Instruct 0905", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 27.2727, - "output": 163.6364 + "input": 1, + "output": 3 }, "type": "chat" - } - ] - }, - "helicone": { - "id": "helicone", - "name": "Helicone", - "display_name": "Helicone", - "api": "https://ai-gateway.helicone.ai/v1", - "doc": "https://helicone.ai/models", - "models": [ + }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": 
{ - "context": 128000, - "output": 16400 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 20, - "output": 40 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "xAI Grok 4.1 Fast Reasoning", - "display_name": "xAI Grok 4.1 Fast Reasoning", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -82188,21 +90586,19 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "gemma2-9b-it", - "name": "Google Gemma 2", - "display_name": "Google Gemma 2", + "id": "openai/gpt-oss-safeguard-20b", + "name": "Safety GPT OSS 20B", + "display_name": "Safety GPT OSS 20B", "modalities": { "input": [ "text" @@ -82212,29 +90608,30 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-25", - "last_updated": "2024-06-25", + 
"open_weights": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.01, - "output": 0.03 + "input": 0.075, + "output": 0.3, + "cache_read": 0.037 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Meta Llama 3.3 70B Instruct", - "display_name": "Meta Llama 3.3 70B Instruct", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -82244,33 +90641,37 @@ ] }, "limit": { - "context": 128000, - "output": 16400 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.13, - "output": 0.39 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "llama-4-scout", - "name": "Meta Llama 4 Scout 17B 16E", - "display_name": "Meta Llama 4 Scout 17B 16E", + "id": "groq/compound", + "name": "Compound", + "display_name": "Compound", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -82283,180 +90684,165 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-09-04", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "chatgpt-4o-latest", - "name": "OpenAI ChatGPT-4o", - "display_name": "OpenAI ChatGPT-4o", + "id": "groq/compound-mini", + "name": "Compound Mini", + 
"display_name": "Compound Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-14", - "last_updated": "2024-08-14", + "knowledge": "2025-09-04", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 5, - "output": 20, - "cache_read": 2.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3.5-sonnet-v2", - "name": "Anthropic: Claude 3.5 Sonnet v2", - "display_name": "Anthropic: Claude 3.5 Sonnet v2", + "id": "canopylabs/orpheus-arabic-saudi", + "name": "Orpheus Arabic Saudi", + "display_name": "Orpheus Arabic Saudi", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 4000, + "output": 50000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-12-16", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 40, + "output": 0 }, "type": "chat" }, - { - "id": "hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + { + "id": "canopylabs/orpheus-v1-english", + "name": "Orpheus V1 English", + "display_name": "Orpheus V1 English", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 4000, + "output": 50000 }, "temperature": true, - 
"tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "knowledge": "2025-12-19", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 0.14, - "output": 0.14 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", + "id": "qwen/qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-02", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "open_weights": true, + "knowledge": "2024-11-08", + "release_date": "2024-12-23", + "last_updated": "2024-12-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 0.29, + "output": 0.59 }, "type": "chat" }, { - "id": "llama-prompt-guard-2-22m", - "name": "Meta Llama Prompt Guard 2 22M", - "display_name": "Meta Llama Prompt Guard 2 22M", + "id": "meta-llama/llama-prompt-guard-2-22m", + "name": "Llama Prompt Guard 2 22M", + "display_name": "Llama Prompt Guard 2 22M", "modalities": { "input": [ "text" @@ 
-82467,7 +90853,7 @@ }, "limit": { "context": 512, - "output": 2 + "output": 512 }, "temperature": true, "tool_call": false, @@ -82475,143 +90861,122 @@ "supported": false }, "attachment": false, - "open_weights": false, + "open_weights": true, "knowledge": "2024-10", "release_date": "2024-10-01", "last_updated": "2024-10-01", "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "o1-mini", - "name": "OpenAI: o1-mini", - "display_name": "OpenAI: o1-mini", + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B", + "display_name": "Llama 4 Scout 17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.11, + "output": 0.34 }, "type": "chat" }, { - "id": "gpt-4.1-mini-2025-04-14", - "name": "OpenAI GPT-4.1 Mini", - "display_name": "OpenAI GPT-4.1 Mini", + "id": "meta-llama/llama-prompt-guard-2-86m", + "name": "Llama Prompt Guard 2 86M", + "display_name": "Llama Prompt Guard 2 86M", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 512, + "output": 512 }, 
"temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999, - "cache_read": 0.09999999999999999 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "meta-llama/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17B", + "display_name": "Llama 4 Maverick 17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.03, - "output": 0.13 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "meta-llama/llama-guard-4-12b", + "name": "Llama Guard 4 12B", + "display_name": "Llama Guard 4 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -82619,86 +90984,82 @@ }, "limit": { "context": 131072, - "output": 40960 + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.29, - "output": 0.59 + "input": 0.2, + "output": 0.2 }, "type": "chat" - }, + } + ] + }, + "xiaomi-token-plan-sgp": { + "id": "xiaomi-token-plan-sgp", + "name": "Xiaomi Token Plan (Singapore)", + "display_name": "Xiaomi Token Plan (Singapore)", + "api": "https://token-plan-sgp.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ { - "id": "llama-3.3-70b-versatile", - "name": "Meta Llama 3.3 70B Versatile", - "display_name": "Meta Llama 3.3 70B Versatile", + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 32678 + "context": 8192, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.59, - "output": 0.7899999999999999 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "OpenAI GPT-5 Mini", - "display_name": "OpenAI GPT-5 Mini", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 131072 }, - 
"temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -82707,54 +91068,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.024999999999999998 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "OpenAI GPT-5 Nano", - "display_name": "OpenAI GPT-5 Nano", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -82763,53 +91113,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": 
"2025-01-01", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.049999999999999996, - "output": 0.39999999999999997, - "cache_read": 0.005 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Google Gemini 3 Pro Preview", - "display_name": "Google Gemini 3 Pro Preview", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -82821,116 +91158,90 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.19999999999999998 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "claude-3-haiku-20240307", - "name": "Anthropic: Claude 3 Haiku", - "display_name": "Anthropic: Claude 3 Haiku", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 200000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-07", - "last_updated": "2024-03-07", - "cost": { - 
"input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 - }, - "type": "chat" - }, - { - "id": "llama-4-maverick", - "name": "Meta Llama 4 Maverick 17B 128E", - "display_name": "Meta Llama 4 Maverick 17B 128E", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Anthropic: Claude Sonnet 4.5 (20250929)", - "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -82938,35 +91249,53 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-12", + 
"release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" - }, + } + ] + }, + "siliconflow-com": { + "id": "siliconflow-com", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.com/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ { - "id": "gemini-2.5-pro", - "name": "Google Gemini 2.5 Pro", - "display_name": "Google Gemini 2.5 Pro", + "id": "deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "display_name": "deepseek-ai/DeepSeek-R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -82977,51 +91306,39 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.3125, - "cache_write": 1.25 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "claude-4.5-opus", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 
64000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -83031,56 +91348,50 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "xAI Grok 4.1 Fast Non-Reasoning", - "display_name": "xAI Grok 4.1 Fast Non-Reasoning", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "deepseek-ai/DeepSeek-V3.1", + "display_name": "deepseek-ai/DeepSeek-V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "release_date": "2025-08-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "sonar-pro", - "name": "Perplexity Sonar Pro", - "display_name": "Perplexity Sonar Pro", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "modalities": { "input": [ "text" @@ -83090,29 +91401,29 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - 
"knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral-Large", - "display_name": "Mistral-Large", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "modalities": { "input": [ "text" @@ -83122,89 +91433,72 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-24", - "last_updated": "2024-07-24", + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 6 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "o3-pro", - "name": "OpenAI o3 Pro", - "display_name": "OpenAI o3 Pro", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 164000, + "output": 164000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-10-10", + "last_updated": 
"2025-11-25", "cost": { - "input": 20, - "output": 80 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "display_name": "deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -83219,33 +91513,29 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "OpenAI GPT-4o-mini", - "display_name": "OpenAI GPT-4o-mini", + "id": "deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "display_name": "deepseek-ai/DeepSeek-V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -83254,20 +91544,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "claude-4.5-haiku", - "name": "Anthropic: Claude 4.5 Haiku", - "display_name": "Anthropic: Claude 4.5 Haiku", + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "modalities": { "input": [ "text", @@ -83278,31 
+91566,28 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 4000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "release_date": "2024-12-13", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.09999999999999999, - "cache_write": 1.25 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "kimi-k2-0711", - "name": "Kimi K2 (07/11)", - "display_name": "Kimi K2 (07/11)", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "moonshotai/Kimi-K2-Instruct", + "display_name": "moonshotai/Kimi-K2-Instruct", "modalities": { "input": [ "text" @@ -83312,8 +91597,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -83322,33 +91607,31 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-07-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.5700000000000001, - "output": 2.3 + "input": 0.58, + "output": 2.29 }, "type": "chat" }, { - "id": "o4-mini", - "name": "OpenAI o4 Mini", - "display_name": "OpenAI o4 Mini", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "display_name": "moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -83357,99 +91640,73 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - 
"medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 0.55, + "output": 2.5 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Sonar Deep Research", - "display_name": "Perplexity Sonar Deep Research", + "id": "moonshotai/Kimi-K2.6", + "name": "moonshotai/Kimi-K2.6", + "display_name": "moonshotai/Kimi-K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", - "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" - }, - { - "id": "gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "display_name": "Google Gemma 3 12B", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 
0.049999999999999996, - "output": 0.09999999999999999 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Google Gemini 2.5 Flash", - "display_name": "Google Gemini 2.5 Flash", + "id": "moonshotai/Kimi-K2.5", + "name": "moonshotai/Kimi-K2.5", + "display_name": "moonshotai/Kimi-K2.5", "modalities": { "input": [ "text", @@ -83460,8 +91717,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -83472,40 +91729,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.3 + "input": 0.45, + "output": 2.25 }, "type": "chat" }, { - "id": "deepseek-tng-r1t2-chimera", - "name": "DeepSeek TNG R1T2 Chimera", - "display_name": "DeepSeek TNG R1T2 Chimera", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "display_name": "moonshotai/Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -83515,8 +91760,8 @@ ] }, "limit": { - "context": 130000, - "output": 163840 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -83525,88 +91770,65 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-02", - "last_updated": "2025-07-02", + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - 
"input": 0.3, - "output": 1.2 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "OpenAI: GPT-5.1 Codex Mini", - "display_name": "OpenAI: GPT-5.1 Codex Mini", + "id": "openai/gpt-oss-20b", + "name": "openai/gpt-oss-20b", + "display_name": "openai/gpt-oss-20b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131000, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.024999999999999998 + "input": 0.04, + "output": 0.18 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "openai/gpt-oss-120b", + "name": "openai/gpt-oss-120b", + "display_name": "openai/gpt-oss-120b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -83614,23 +91836,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-14", - "last_updated": 
"2025-05-14", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 0.05, + "output": 0.45 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "xAI Grok Code Fast 1", - "display_name": "xAI Grok Code Fast 1", + "id": "zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "display_name": "zai-org/GLM-4.5-Air", "modalities": { "input": [ "text" @@ -83640,92 +91864,59 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-25", - "last_updated": "2024-08-25", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.19999999999999998, - "output": 1.5, - "cache_read": 0.02 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "OpenAI GPT-5.1", - "display_name": "OpenAI GPT-5.1", + "id": "zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "display_name": "zai-org/GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - 
"knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "zai-org/GLM-4.7", + "name": "zai-org/GLM-4.7", + "display_name": "zai-org/GLM-4.7", "modalities": { "input": [ "text" @@ -83735,13 +91926,14 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 205000, + "output": 205000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -83756,20 +91948,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "xAI: Grok 4 Fast Reasoning", - "display_name": "xAI: Grok 4 Fast Reasoning", + "id": "zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "display_name": "zai-org/GLM-4.5V", "modalities": { "input": [ "text", @@ -83780,36 +91970,28 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.19999999999999998, - 
"output": 0.5, - "cache_read": 0.049999999999999996 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "zai-org/GLM-5", + "name": "zai-org/GLM-5", + "display_name": "zai-org/GLM-5", "modalities": { "input": [ "text" @@ -83819,11 +92001,11 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 205000, + "output": 205000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -83831,33 +92013,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "llama-3.1-8b-instant", - "name": "Meta Llama 3.1 8B Instant", - "display_name": "Meta Llama 3.1 8B Instant", + "id": "zai-org/GLM-5.1", + "name": "zai-org/GLM-5.1", + "display_name": "zai-org/GLM-5.1", "modalities": { "input": [ "text" @@ -83867,29 +92044,41 @@ ] }, "limit": { - "context": 131072, - "output": 32678 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": 
"2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.049999999999999996, - "output": 0.08 + "input": 1.4, + "output": 4.4, + "cache_write": 0 }, "type": "chat" }, { - "id": "o3-mini", - "name": "OpenAI o3 Mini", - "display_name": "OpenAI o3 Mini", + "id": "zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "display_name": "zai-org/GLM-4.6", "modalities": { "input": [ "text" @@ -83899,187 +92088,174 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 205000, + "output": 205000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2023-10-01", - "last_updated": "2023-10-01", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.5, + "output": 1.9 }, "type": "chat" }, { - "id": "sonar", - "name": "Perplexity Sonar", - "display_name": "Perplexity Sonar", + "id": "zai-org/GLM-5V-Turbo", + "name": "zai-org/GLM-5V-Turbo", + "display_name": "zai-org/GLM-5V-Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", 
+ "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 1, - "output": 1 + "input": 1.2, + "output": 4, + "cache_write": 0 }, "type": "chat" }, { - "id": "kimi-k2-0905", - "name": "Kimi K2 (09/05)", - "display_name": "Kimi K2 (09/05)", + "id": "zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "display_name": "zai-org/GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2025-12-07", + "last_updated": "2025-12-07", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.39999999999999997 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "mistral-small", - "name": "Mistral Small", - "display_name": "Mistral Small", + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 33000, + "output": 33000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-02", - "release_date": "2024-02-26", - "last_updated": "2024-02-26", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 75, - "output": 200 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": 
"Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 41000, - "output": 41000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.08, - "output": 0.29 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "grok-4", - "name": "xAI Grok 4", - "display_name": "xAI Grok 4", + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", "modalities": { "input": [ "text" @@ -84089,81 +92265,60 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 33000, + "output": 33000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-09", - "last_updated": "2024-07-09", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking", - "name": "Qwen3 235B A22B Thinking", - "display_name": "Qwen3 235B A22B Thinking", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", 
"modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 2.9000000000000004 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "qwen2.5-coder-7b-fast", - "name": "Qwen2.5 Coder 7B fast", - "display_name": "Qwen2.5 Coder 7B fast", + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", "modalities": { "input": [ "text" @@ -84173,29 +92328,28 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09-15", - "last_updated": "2024-09-15", + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.03, - "output": 0.09 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct-turbo", - "name": "Meta Llama 3.1 8B Instruct Turbo", - "display_name": "Meta Llama 3.1 8B Instruct Turbo", + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", "modalities": { "input": [ "text" @@ -84205,8 +92359,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 33000, + 
"output": 33000 }, "temperature": true, "tool_call": true, @@ -84215,53 +92369,50 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.02, - "output": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "nex-agi/DeepSeek-V3.1-Nex-N1", + "name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "last_updated": "2025-11-25", "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "Zai GLM-4.6", - "display_name": "Zai GLM-4.6", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -84271,35 +92422,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-04-23", + "last_updated": "2025-11-25", "cost": { - 
"input": 0.44999999999999996, - "output": 1.5 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ "text" @@ -84309,135 +92453,116 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.21, + "output": 0.57 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Anthropic: Claude Opus 4.1 (20250805)", - "display_name": "Anthropic: Claude Opus 4.1 (20250805)", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMaxAI/MiniMax-M2.1", + "display_name": "MiniMaxAI/MiniMax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 197000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - 
"knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "OpenAI GPT-5.1 Chat", - "display_name": "OpenAI GPT-5.1 Chat", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMaxAI/MiniMax-M2.5", + "display_name": "MiniMaxAI/MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 197000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Anthropic: Claude 4.5 Haiku (20251001)", - "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -84446,21 +92571,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "release_date": "2025-07-02", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 5, - 
"cache_read": 0.09999999999999999, - "cache_write": 1.25 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "sonar-reasoning", - "name": "Perplexity Sonar Reasoning", - "display_name": "Perplexity Sonar Reasoning", + "id": "stepfun-ai/Step-3.5-Flash", + "name": "stepfun-ai/Step-3.5-Flash", + "display_name": "stepfun-ai/Step-3.5-Flash", "modalities": { "input": [ "text" @@ -84470,42 +92592,42 @@ ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 1, - "output": 5 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -84513,23 +92635,31 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.1, + "output": 0.4 }, "type": 
"chat" }, { - "id": "llama-prompt-guard-2-86m", - "name": "Meta Llama Prompt Guard 2 86M", - "display_name": "Meta Llama Prompt Guard 2 86M", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -84539,29 +92669,40 @@ ] }, "limit": { - "context": 512, - "output": 2 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "OpenAI GPT-4.1 Nano", - "display_name": "OpenAI GPT-4.1 Nano", + "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", "modalities": { "input": [ "text", @@ -84572,30 +92713,40 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-10-04", + "last_updated": 
"2025-11-25", "cost": { - "input": 0.09999999999999999, - "output": 0.39999999999999997, - "cache_read": 0.024999999999999998 + "input": 0.45, + "output": 3.5 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -84605,8 +92756,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -84615,54 +92766,61 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.09999999999999999, - "output": 0.3 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-09-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.7999999999999999, - "output": 4, - 
"cache_read": 0.08, - "cache_write": 1 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "xAI Grok 3 Mini", - "display_name": "xAI Grok 3 Mini", + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", "modalities": { "input": [ "text" @@ -84672,79 +92830,70 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-07-30", + "last_updated": "2025-11-25", 
"cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", "modalities": { "input": [ "text" @@ -84754,8 +92903,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -84764,24 +92913,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.27, - "output": 0.41 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "OpenAI GPT-OSS 20b", - "display_name": "OpenAI GPT-OSS 20b", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ "text" @@ -84791,35 +92945,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-08-01", + "last_updated": "2025-11-25", "cost": { - "input": 0.049999999999999996, - "output": 0.19999999999999998 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - 
"display_name": "OpenAI: GPT-5 Pro", + "id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "display_name": "Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ "text" @@ -84829,78 +92976,61 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 33000, + "output": 4000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 120 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "llama-guard-4", - "name": "Meta Llama Guard 4 12B", - "display_name": "Meta Llama Guard 4 12B", + "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 1024 + "context": 66000, + "output": 66000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.21, - "output": 0.21 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "OpenAI GPT-4o", - "display_name": 
"OpenAI GPT-4o", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", @@ -84911,54 +93041,50 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { "input": 0.3, "output": 1.5 @@ -84966,113 +93092,84 @@ "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Google Gemini 2.5 Flash Lite", - "display_name": "Google Gemini 2.5 Flash Lite", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 262000, + 
"output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "release_date": "2025-07-23", + "last_updated": "2025-11-25", "cost": { - "input": 0.09999999999999999, - "output": 0.39999999999999997, - "cache_read": 0.024999999999999998, - "cache_write": 0.09999999999999999 + "input": 0.09, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-coder", - "name": "Qwen3 Coder 480B A35B Instruct Turbo", - "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", + "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.22, - "output": 0.95 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "gpt-5", - "name": "OpenAI GPT-5", - "display_name": "OpenAI GPT-5", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
400000, - "output": 128000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -85081,84 +93178,72 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-03-06", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.15, + "output": 0.58 }, "type": "chat" }, { - "id": "ernie-4.5-21b-a3b-thinking", - "name": "Baidu Ernie 4.5 21B A3B Thinking", - "display_name": "Baidu Ernie 4.5 21B A3B Thinking", + "id": "Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "display_name": "Qwen/Qwen3-VL-32B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-03-16", - "last_updated": "2025-03-16", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "OpenAI GPT-OSS 120b", - "display_name": "OpenAI GPT-OSS 120b", + "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", 
+ "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -85168,24 +93253,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-10-11", + "last_updated": "2025-11-25", "cost": { - "input": 0.04, - "output": 0.16 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "gpt-5-chat-latest", - "name": "OpenAI GPT-5 Chat Latest", - "display_name": "OpenAI GPT-5 Chat Latest", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", "modalities": { "input": [ "text", @@ -85196,99 +93286,91 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09-30", - "last_updated": "2024-09-30", + "release_date": "2025-03-24", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "claude-4.5-sonnet", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "modalities": 
{ "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "display_name": "Qwen/Qwen3-VL-8B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 + "input": 0.18, + "output": 0.68 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Meta Llama 3.1 8B Instruct", - "display_name": "Meta Llama 3.1 8B Instruct", + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ "text" @@ -85298,8 +93380,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -85308,19 +93390,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-23", - 
"last_updated": "2024-07-23", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.02, - "output": 0.049999999999999996 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "OpenAI GPT-4.1", - "display_name": "OpenAI GPT-4.1", + "id": "Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Qwen/Qwen2.5-VL-7B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", "modalities": { "input": [ "text", @@ -85331,30 +93412,28 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", "modalities": { "input": [ "text" @@ -85364,8 +93443,8 @@ ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -85385,31 +93464,29 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.48, - "output": 2 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "OpenAI GPT-4.1 Mini", - "display_name": "OpenAI GPT-4.1 Mini", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" 
], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -85418,111 +93495,92 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-11-11", + "last_updated": "2025-11-25", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999, - "cache_read": 0.09999999999999999 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.21600000000000003 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "OpenAI: GPT-5.1 Codex", - "display_name": "OpenAI: GPT-5.1 Codex", + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "display_name": "Qwen/Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": 
true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.35, + "output": 1.42 }, "type": "chat" }, { - "id": "grok-3", - "name": "xAI Grok 3", - "display_name": "xAI Grok 3", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -85532,8 +93590,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -85542,97 +93600,62 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "xAI Grok 4 Fast Non-Reasoning", - "display_name": "xAI Grok 4 Fast Non-Reasoning", + "id": "Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "display_name": "Qwen/Qwen3-VL-8B-Thinking", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 262000, + "output": 262000 }, "temperature": true, 
"tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", - "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 - }, - "type": "chat" - }, - { - "id": "sonar-reasoning-pro", - "name": "Perplexity Sonar Reasoning Pro", - "display_name": "Perplexity Sonar Reasoning Pro", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 127000, - "output": 4096 - }, - "temperature": true, - "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8 + "input": 0.18, + "output": 2 }, "type": "chat" - } - ] - }, - "zai-coding-plan": { - "id": "zai-coding-plan", - "name": "Z.AI Coding Plan", - "display_name": "Z.AI Coding Plan", - "api": "https://api.z.ai/api/coding/paas/v4", - "doc": "https://docs.z.ai/devpack/overview", - "models": [ + }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", "modalities": { "input": [ "text" @@ -85642,8 +93665,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -85663,22 +93686,19 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": 
"2025-12-22", + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ "text" @@ -85688,42 +93708,28 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2024-09-19", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ "text" @@ -85733,43 +93739,40 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.59, + 
"output": 0.59 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "display_name": "Qwen/Qwen3-VL-32B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -85788,36 +93791,31 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", "modalities": { "input": [ - "text", - "image", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -85827,39 +93825,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.14, + "output": 0.57 }, "type": "chat" - } - ] - }, - "amazon-bedrock": { - "id": "amazon-bedrock", - "name": "Amazon Bedrock", - "display_name": "Amazon Bedrock", - "doc": 
"https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", - "models": [ + }, { - "id": "openai.gpt-oss-safeguard-120b", - "name": "GPT OSS Safeguard 120B", - "display_name": "GPT OSS Safeguard 120B", + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", "modalities": { "input": [ "text" @@ -85869,8 +93851,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -85879,18 +93861,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "nvidia.nemotron-nano-3-30b", - "name": "NVIDIA Nemotron Nano 3 30B", - "display_name": "NVIDIA Nemotron Nano 3 30B", + "id": "inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", "modalities": { "input": [ "text" @@ -85900,29 +93882,28 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", "cost": { - "input": 0.06, - "output": 0.24 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "nvidia.nemotron-super-3-120b", - "name": "NVIDIA Nemotron 3 Super 120B A12B", - "display_name": "NVIDIA Nemotron 3 Super 120B A12B", + "id": "deepseek-ai/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -85932,8 +93913,8 @@ ] }, "limit": { - "context": 
262144, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -85941,20 +93922,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.15, - "output": 0.65 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "writer.palmyra-x5-v1:0", - "name": "Palmyra X5", - "display_name": "Palmyra X5", + "id": "deepseek-ai/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -85964,8 +93958,8 @@ ] }, "limit": { - "context": 1040000, - "output": 8192 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -85973,55 +93967,86 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.6, - "output": 6 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "google-vertex": { + "id": "google-vertex", + "name": "Vertex", + "display_name": "Vertex", + "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", + "models": [ { - "id": "mistral.ministral-3-8b-instruct", - "name": "Ministral 3 8B", - "display_name": "Ministral 3 8B", + "id": 
"gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 }, "type": "chat" }, { - "id": "au.anthropic.claude-opus-4-6-v1", - "name": "AU Anthropic Claude Opus 4.6", - "display_name": "AU Anthropic Claude Opus 4.6", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09-25", + "display_name": "Gemini 2.5 Flash Preview 09-25", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -86029,94 +94054,186 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", + "default_enabled": true, + "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, "unit": "tokens" }, - "effort": "medium", - "effort_options": [ + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5, + 
"cache_read": 0.075, + "cache_write": 0.383 + }, + "type": "chat" + }, + { + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 16.5, - "output": 82.5, - "cache_read": 1.65, - "cache_write": 20.625 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "mistral.ministral-3-3b-instruct", - "name": "Ministral 3 3B", - "display_name": "Ministral 3 3B", + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "display_name": "Gemini 2.5 Flash Lite Preview 06-17", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": 
true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { "input": 0.1, - "output": 0.1 + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -86124,8 +94241,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -86133,33 +94250,57 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + 
"cache_write": 0.383 }, "type": "chat" }, { - "id": "mistral.devstral-2-123b", - "name": "Devstral 2 123B", - "display_name": "Devstral 2 123B", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 1048576, "output": 8192 }, "temperature": true, @@ -86167,24 +94308,25 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.4, - "output": 2 + "input": 0.15, + "output": 0.6, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (Global)", - "display_name": "Claude Opus 4.5 (Global)", + "id": "deepseek-ai/deepseek-v3.1-maas", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -86192,8 +94334,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163840, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -86201,136 +94343,141 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 1.7 }, "type": "chat" }, { - "id": "mistral.voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "deepseek-ai/deepseek-v3.2-maas", + "name": "DeepSeek V3.2", + 
"display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2025-12-17", + "last_updated": "2026-04-04", "cost": { - "input": 0.15, - "output": 0.35 + "input": 0.56, + "output": 1.68, + "cache_read": 0.056 }, "type": "chat" }, { - "id": "google.gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "display_name": "Google Gemma 3 12B", + "id": "moonshotai/kimi-k2-thinking-maas", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.049999999999999996, - "output": 0.09999999999999999 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "amazon.nova-pro-v1:0", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "openai/gpt-oss-20b-maas", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": 
[ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 + "input": 0.07, + "output": 0.25 }, "type": "chat" }, { - "id": "anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/gpt-oss-120b-maas", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -86338,23 +94485,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.09, + "output": 0.36 }, "type": "chat" }, { - "id": "minimax.minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "zai-org/glm-5-maas", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -86364,8 +94508,8 @@ ] }, "limit": { - "context": 204608, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -86373,24 +94517,35 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + 
"summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1, + "output": 3.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "global.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (Global)", - "display_name": "Claude Opus 4.7 (Global)", + "id": "zai-org/glm-4.7-maas", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -86398,162 +94553,144 @@ ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-06", + "last_updated": "2026-01-06", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "mistral.pixtral-large-2502-v1:0", - "name": "Pixtral Large (25.02)", - "display_name": "Pixtral Large (25.02)", + "id": "qwen/qwen3-235b-a22b-instruct-2507-maas", + "name": "Qwen3 235B A22B Instruct", + "display_name": "Qwen3 235B A22B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-08", - "last_updated": "2025-04-08", + "open_weights": true, + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": { - "input": 2, - "output": 6 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct", - "display_name": "Llama 4 Maverick 17B Instruct", + "id": "meta/llama-3.3-70b-instruct-maas", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2023-12", + "release_date": "2025-04-29", + 
"last_updated": "2025-04-29", "cost": { - "input": 0.24, - "output": 0.97 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "us.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (US)", - "display_name": "Claude Sonnet 4.5 (US)", + "id": "meta/llama-4-maverick-17b-128e-instruct-maas", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 524288, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.35, + "output": 1.15 }, "type": "chat" }, { - "id": "us.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (US)", - "display_name": "Claude Haiku 4.5 (US)", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -86561,8 +94698,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -86570,60 +94707,34 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" - }, - { - "id": "amazon.nova-micro-v1:0", - "name": "Nova Micro", - 
"display_name": "Nova Micro", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "global.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (Global)", - "display_name": "Claude Sonnet 4.5 (Global)", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -86631,8 +94742,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -86640,65 +94751,72 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - }, - { - "id": "openai.gpt-oss-20b-1:0", - "name": "gpt-oss-20b", - 
"display_name": "gpt-oss-20b", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } ] }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0.07, - "output": 0.3 - }, "type": "chat" }, { - "id": "zai.glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "display_name": "Gemini 2.5 Flash Preview 04-17", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 101376 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -86709,39 +94827,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 1, - "output": 3.2 + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "qwen.qwen3-32b-v1:0", - "name": "Qwen3 32B (dense)", - "display_name": "Qwen3 32B (dense)", + 
"id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "display_name": "Gemini 2.5 Flash Preview 05-20", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -86749,32 +94882,57 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { "input": 0.15, - "output": 0.6 + "output": 0.6, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "deepseek.v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "display_name": "Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 81920 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -86782,25 +94940,47 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": 
-1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.62, - "output": 1.85 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "eu.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (EU)", - "display_name": "Claude Haiku 4.5 (EU)", + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "display_name": "Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -86808,8 +94988,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -86817,60 +94997,104 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "zai.glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + 
"pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.07, - "output": 0.4 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (US)", - "display_name": "Claude Opus 4.7 (US)", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -86878,10 +95102,10 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -86891,80 +95115,82 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable 
thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "amazon.nova-2-lite-v1:0", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.33, - "output": 2.75 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -86972,135 +95198,221 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - 
"supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen.qwen3-coder-480b-a35b-v1:0", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.22, - "output": 1.8 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "amazon.nova-lite-v1:0", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": 
"gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "meta.llama3-1-8b-instruct-v1:0", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + 
"last_updated": "2026-02-19", "cost": { - "input": 0.22, - "output": 0.22 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -87108,102 +95420,103 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", - "high", - "xhigh" + "high" ], - "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "google.gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "display_name": "Google Gemma 3 27B Instruct", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 8192 + "context": 2048, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-27", - "last_updated": "2025-07-27", + "attachment": false, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.12, - "output": 0.2 + "input": 0.15, + "output": 0 }, - "type": "chat" - }, + "type": "embedding" + } + ] + }, + "databricks": { + "id": "databricks", + "name": "Databricks", + "display_name": "Databricks", + "api": "https://${DATABRICKS_HOST}/ai-gateway/mlflow/v1", + "doc": "https://docs.databricks.com/aws/en/machine-learning/foundation-models/", + "models": [ { - "id": "global.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (Global)", - "display_name": "Claude Haiku 4.5 (Global)", + "id": "databricks-gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 
64000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -87211,99 +95524,119 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "google.gemma-3-4b-it", - "name": "Gemma 3 4B IT", - "display_name": "Gemma 3 4B IT", + "id": "databricks-gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.04, - "output": 0.08 + "input": 0.072, + "output": 0.28 }, "type": "chat" }, { - "id": "meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct", - "display_name": "Llama 4 Scout 17B Instruct", + "id": "databricks-gemini-3-pro", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 3500000, - "output": 16384 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - 
"last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.17, - "output": 0.66 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek.v3-v1:0", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "databricks-claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 81920 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -87311,33 +95644,38 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.58, - "output": 1.68 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mistral.magistral-small-2509", - "name": "Magistral Small 1.2", - "display_name": "Magistral Small 1.2", + "id": "databricks-gemini-3-1-flash-lite", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 40000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -87345,62 +95683,99 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": 
true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "qwen.qwen3-next-80b-a3b", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "databricks-claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.14, - "output": 1.4 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "zai.glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "databricks-claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -87408,74 +95783,64 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.6, - "output": 2.2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "moonshot.kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "databricks-gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": 
true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.6, - "output": 2.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (US)", - "display_name": "Claude Opus 4.5 (US)", + "id": "databricks-gemini-3-flash", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -87483,8 +95848,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -87494,148 +95859,191 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "mistral.ministral-3-14b-instruct", - "name": "Ministral 14B 3.0", - "display_name": "Ministral 14B 3.0", + "id": "databricks-gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-05-30", 
+ "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "deepseek.r1-v1:0", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "databricks-claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 1.35, - "output": 5.4 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "mistral.voxtral-mini-3b-2507", - "name": "Voxtral Mini 3B 2507", - "display_name": "Voxtral Mini 3B 2507", + "id": "databricks-claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ - "audio", - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.04, - "output": 0.04 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai.gpt-oss-120b-1:0", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "databricks-gpt-5-4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + 
"last_updated": "2026-03-17", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "nvidia.nemotron-nano-12b-v2", - "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", - "display_name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "id": "databricks-gpt-5-2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -87646,28 +96054,31 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.2, - "output": 0.6 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (EU)", - "display_name": "Claude Opus 4.7 (EU)", + "id": "databricks-claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -87726,105 +96137,61 @@ "type": "chat" }, { - "id": "minimax.minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "databricks-gpt-5-4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 98304 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", - "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" - }, - { - "id": 
"meta.llama3-3-70b-instruct-v1:0", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.72, - "output": 0.72 - }, - "type": "chat" - }, - { - "id": "meta.llama3-1-70b-instruct-v1:0", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } ] }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.72, - "output": 0.72 - }, "type": "chat" }, { - "id": "eu.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (EU)", - "display_name": "Claude Sonnet 4.5 (EU)", + "id": "databricks-claude-sonnet-4", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -87859,24 +96226,23 @@ "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (EU)", - "display_name": "Claude Opus 4.5 (EU)", + "id": "databricks-gpt-5-4-mini", + "name": 
"GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -87884,64 +96250,78 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "moonshotai.kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "databricks-gpt-5-5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.6, - "output": 3 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "au.anthropic.claude-sonnet-4-6", - "name": "AU Anthropic Claude Sonnet 4.6", - "display_name": 
"AU Anthropic Claude Sonnet 4.6", + "id": "databricks-gemini-2-5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -87949,132 +96329,134 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33, - "cache_write": 4.125 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "openai.gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "display_name": "GPT OSS Safeguard 20B", + "id": "databricks-gemini-2-5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + 
"output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.07, - "output": 0.2 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "qwen.qwen3-coder-30b-a3b-v1:0", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "databricks-gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "minimax.minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "databricks-claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -88082,84 +96464,121 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": 
"2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen.qwen3-vl-235b-a22b", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "databricks-gemini-3-1-pro", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.3, - "output": 1.5 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen.qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "databricks-gpt-5-1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": 
"2026-02-06", - "last_updated": "2026-02-06", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.22, - "output": 1.8 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" - }, + } + ] + }, + "berget": { + "id": "berget", + "name": "Berget.AI", + "display_name": "Berget.AI", + "api": "https://api.berget.ai/v1", + "doc": "https://api.berget.ai", + "models": [ { - "id": "nvidia.nemotron-nano-9b-v2", - "name": "NVIDIA Nemotron Nano 9B v2", - "display_name": "NVIDIA Nemotron Nano 9B v2", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ "text" @@ -88170,61 +96589,81 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.06, - "output": 0.23 + "input": 0.44, + "output": 0.99 }, "type": "chat" - }, - { - "id": "mistral.mistral-large-3-675b-instruct", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + }, + { + "id": "zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2025-12", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.77, + "output": 2.75 }, "type": "chat" }, { - "id": "qwen.qwen3-235b-a22b-2507-v1:0", - "name": "Qwen3 235B A22B 2507", - "display_name": "Qwen3 235B A22B 2507", + "id": "mistralai/Mistral-Medium-3.5-128B", + "name": "Mistral Medium 3.5 128B", + "display_name": "Mistral Medium 3.5 128B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -88238,23 +96677,24 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2026-04", + "release_date": "2026-04-29", + "last_updated": "2026-04-29", "cost": { - "input": 0.22, - "output": 0.88 + "input": 1.65, + "output": 5.5 }, "type": "chat" }, { - "id": "writer.palmyra-x4-v1:0", - "name": "Palmyra X4", - "display_name": "Palmyra X4", + "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24B Instruct 2506", + "display_name": "Mistral Small 3.2 24B Instruct 2506", "modalities": { "input": [ "text" @@ -88264,7 +96704,7 @@ ] }, "limit": { - "context": 122880, + "context": 32000, "output": 8192 }, "temperature": true, @@ -88274,32 +96714,34 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0.33, + "output": 0.33 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-1-20250805-v1:0", - "name": "Claude Opus 4.1", - "display_name": 
"Claude Opus 4.1", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B Instruct", + "display_name": "Gemma 4 31B Instruct", "modalities": { "input": [ - "text", + "audio", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -88308,22 +96750,20 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.275, + "output": 0.55 }, "type": "chat" }, { - "id": "us.deepseek.r1-v1:0", - "name": "DeepSeek-R1 (US)", - "display_name": "DeepSeek-R1 (US)", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -88334,7 +96774,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -88343,129 +96783,122 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.99, + "output": 0.99 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (EU)", - "display_name": "Claude Opus 4.6 (EU)", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 262144 }, 
"temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.83, + "output": 3.85, + "cache_read": 0.16 }, "type": "chat" - }, + } + ] + }, + "moonshot": { + "id": "moonshot", + "name": "Moonshot AI (China)", + "display_name": "Moonshot AI (China)", + "api": "https://api.moonshot.cn/v1", + "doc": "https://platform.moonshot.cn/docs/api/chat", + "models": [ { - "id": "us.meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct (US)", - "display_name": "Llama 4 Maverick 17B Instruct (US)", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": 
"2025-09-05", "cost": { - "input": 0.24, - "output": 0.97 + "input": 2.4, + "output": 10, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "au.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (AU)", - "display_name": "Claude Haiku 4.5 (AU)", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -88473,36 +96906,44 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "jp.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (JP)", - "display_name": "Claude Sonnet 4.5 (JP)", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -88510,343 +96951,251 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + 
"summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.15, + "output": 8, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "jp.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (JP)", - "display_name": "Claude Sonnet 4.6 (JP)", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "global.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (Global)", - "display_name": "Claude Sonnet 4.6 (Global)", + "id": "kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "us.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (US)", - "display_name": "Claude Sonnet 4.6 (US)", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" - }, + } + ] + }, + "alibaba-coding-plan-cn": { + "id": "alibaba-coding-plan-cn", + "name": "Alibaba Coding Plan (China)", + "display_name": "Alibaba Coding Plan (China)", + "api": "https://coding.dashscope.aliyuncs.com/v1", + "doc": "https://help.aliyun.com/zh/model-studio/coding-plan", + "models": [ { - "id": "global.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (Global)", - "display_name": "Claude Opus 4.6 (Global)", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (US)", - "display_name": "Claude Opus 4.6 (US)", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -88854,107 +97203,88 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-1-20250805-v1:0", - "name": "Claude Opus 4.1 (US)", - "display_name": "Claude Opus 4.1 (US)", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "au.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (AU)", - "display_name": "Claude Sonnet 4.5 (AU)", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -88962,252 +97292,258 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": 
true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "eu.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (EU)", - "display_name": "Claude Sonnet 4.6 (EU)", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 196608, + "output": 24576 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "us.meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct (US)", - "display_name": "Llama 4 Scout 17B Instruct (US)", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 3500000, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 0.17, - "output": 0.66 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + 
"default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "jp.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (JP)", - "display_name": "Claude Opus 4.7 (JP)", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not 
be treated as a thinking budget." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" } ] }, - "the-grid-ai": { - "id": "the-grid-ai", - "name": "The Grid AI", - "display_name": "The Grid AI", - "api": "https://api.thegrid.ai/v1", - "doc": "https://thegrid.ai/docs", + "minimax-cn": { + "id": "minimax-cn", + "name": "MiniMax (minimaxi.com)", + "display_name": "MiniMax (minimaxi.com)", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/guides/quickstart", "models": [ { - "id": "text-prime", - "name": "Text Prime", - "display_name": "Text Prime", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -89217,8 +97553,8 @@ ] }, "limit": { - "context": 128000, - "output": 30000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -89226,16 +97562,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": false, - "release_date": 
"2026-02-26", - "last_updated": "2026-02-26", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.3, + "output": 1.2 + }, "type": "chat" }, { - "id": "text-standard", - "name": "Text Standard", - "display_name": "Text Standard", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -89245,8 +97590,8 @@ ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -89254,16 +97599,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 + }, "type": "chat" }, { - "id": "text-max", - "name": "Text Max", - "display_name": "Text Max", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -89273,8 +97635,8 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -89282,25 +97644,27 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-24", - "last_updated": "2026-03-24", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 + }, "type": "chat" - } - ] - }, - "baseten": { - "id": "baseten", - "name": 
"Baseten", - "display_name": "Baseten", - "api": "https://inference.baseten.co/v1", - "doc": "https://docs.baseten.co/development/model-apis/overview", - "models": [ + }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -89332,19 +97696,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0.6, - "output": 2.2 + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" @@ -89354,7 +97719,7 @@ ] }, "limit": { - "context": 202752, + "context": 204800, "output": 131072 }, "temperature": true, @@ -89365,30 +97730,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.95, - "output": 3.15 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -89398,13 +97758,14 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 196608, + "output": 128000 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -89413,19 +97774,27 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-08-31", - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.3, + "output": 1.2 }, "type": "chat" - }, + } + ] + }, + "chutes": { + "id": "chutes", + "name": "Chutes", + "display_name": "Chutes", + "api": "https://llm.chutes.ai/v1", + "doc": "https://llm.chutes.ai/v1/models", + "models": [ { - "id": "nvidia/Nemotron-120B-A12B", - "name": "Nemotron 3 Super", - "display_name": "Nemotron 3 Super", + "id": "deepseek-ai/DeepSeek-R1-0528-TEE", + "name": "DeepSeek R1 0528 TEE", + "display_name": "DeepSeek R1 0528 TEE", "modalities": { "input": [ "text" @@ -89435,8 +97804,8 @@ ] }, "limit": { - "context": 262144, - "output": 32678 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -89457,19 +97826,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.3, - "output": 0.75 + "input": 0.45, + "output": 2.15, + "cache_read": 0.225 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "deepseek-ai/DeepSeek-V3.1-TEE", + "name": "DeepSeek V3.1 TEE", + "display_name": "DeepSeek V3.1 TEE", "modalities": { "input": [ "text" @@ -89479,8 +97848,8 @@ ] }, "limit": { - "context": 164000, - "output": 131000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -89488,20 +97857,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "deepseek-ai/DeepSeek-V3-0324-TEE", + "name": "DeepSeek V3 0324 TEE", + "display_name": "DeepSeek V3 0324 TEE", "modalities": { "input": [ "text" @@ -89511,8 +97892,8 @@ ] }, "limit": { - "context": 164000, - "output": 131000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -89521,19 +97902,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.77, - "output": 0.77 + "input": 0.25, + "output": 1, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -89543,8 +97924,8 @@ ] }, "limit": { - "context": 163800, - "output": 131100 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -89565,19 +97946,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-01", - "last_updated": "2026-03-06", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.3, - "output": 0.45 + "input": 0.0272, + "output": 0.1087, + "cache_read": 0.0136 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - 
"display_name": "GPT OSS 120B", + "id": "deepseek-ai/DeepSeek-V3.2-TEE", + "name": "DeepSeek V3.2 TEE", + "display_name": "DeepSeek V3.2 TEE", "modalities": { "input": [ "text" @@ -89587,8 +97968,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -89598,27 +97979,35 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0.28, + "output": 0.42, + "cache_read": 0.14 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "moonshotai/Kimi-K2.5-TEE", + "name": "Kimi K2.5 TEE", + "display_name": "Kimi K2.5 TEE", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -89626,7 +98015,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65535 }, "temperature": true, "tool_call": true, @@ -89645,21 +98034,22 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2026-03-06", + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-04-25", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.44, + "output": 2, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "moonshotai/Kimi-K2.6-TEE", + "name": "Kimi K2.6 TEE", + "display_name": "Kimi K2.6 TEE", "modalities": { "input": [ "text", @@ -89672,7 +98062,7 @@ }, "limit": { "context": 262144, - 
"output": 262144 + "output": 65535 }, "temperature": true, "tool_call": true, @@ -89693,52 +98083,20 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2025-12", + "release_date": "2026-04-20", + "last_updated": "2026-04-25", "cost": { "input": 0.95, "output": 4, - "cache_read": 0.16 - }, - "type": "chat" - }, - { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 Instruct 0905", - "display_name": "Kimi K2 Instruct 0905", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-09-05", - "last_updated": "2026-03-06", - "cost": { - "input": 0.6, - "output": 2.5 + "cache_read": 0.475 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "openai/gpt-oss-120b-TEE", + "name": "gpt oss 120b TEE", + "display_name": "gpt oss 120b TEE", "modalities": { "input": [ "text" @@ -89748,8 +98106,8 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -89768,21 +98126,21 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-30", - "last_updated": "2026-02-12", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.6, - "output": 3 + "input": 0.09, + "output": 0.36, + "cache_read": 0.045 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "zai-org/GLM-5-TEE", + "name": "GLM 5 TEE", + "display_name": "GLM 5 TEE", "modalities": { "input": [ "text" @@ -89792,8 +98150,8 @@ ] }, "limit": { - 
"context": 204000, - "output": 204000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -89814,19 +98172,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-02-14", + "last_updated": "2026-04-25", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.95, + "output": 2.55, + "cache_read": 0.475 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "zai-org/GLM-4.7-TEE", + "name": "GLM 4.7 TEE", + "display_name": "GLM 4.7 TEE", "modalities": { "input": [ "text" @@ -89836,8 +98194,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -89858,41 +98216,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.15 + "input": 0.39, + "output": 1.75, + "cache_read": 0.195 }, "type": "chat" - } - ] - }, - "frogbot": { - "id": "frogbot", - "name": "FrogBot", - "display_name": "FrogBot", - "api": "https://app.frogbot.ai/api/v1", - "doc": "https://docs.frogbot.ai", - "models": [ + }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "zai-org/GLM-4.7-FP8", + "name": "GLM 4.7 FP8", + "display_name": "GLM 4.7 FP8", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -89900,40 +98247,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - 
"attachment": true, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-04-25", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.2989, + "output": 1.1957, + "cache_read": 0.14945 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "zai-org/GLM-5.1-TEE", + "name": "GLM 5.1 TEE", + "display_name": "GLM 5.1 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -89943,38 +98282,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-04-25", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 1.05, + "output": 3.5, + "cache_read": 0.525 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "zai-org/GLM-5-Turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -89994,201 +98336,130 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "open_weights": true, + 
"release_date": "2026-03-11", + "last_updated": "2026-04-25", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.4891, + "output": 1.9565, + "cache_read": 0.24455 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "zai-org/GLM-4.6V", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 0.9, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "unsloth/gemma-3-27b-it", + "name": "gemma 3 27b it", + "display_name": "gemma 3 27b it", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 0.0272, + "output": 0.1087, + "cache_read": 0.0136 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "unsloth/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131072, + "output": 131072 }, - 
"temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.02, + "output": 0.04, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "zai-glm-5-1", - "name": "Z.AI GLM-5.1", - "display_name": "Z.AI GLM-5.1", + "id": "unsloth/Llama-3.2-3B-Instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -90198,121 +98469,94 @@ ] }, "limit": { - "context": 198000, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-20", - "last_updated": "2025-02-22", + "release_date": "2025-02-12", + "last_updated": "2026-04-25", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.01, + "output": 0.0136, + "cache_read": 0.005 }, "type": "chat" }, { - "id": 
"gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "unsloth/gemma-3-12b-it", + "name": "gemma 3 12b it", + "display_name": "gemma 3 12b it", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.03, + "output": 0.1, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "unsloth/Llama-3.2-1B-Instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-04-25", "cost": { - 
"input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.01, + "output": 0.0109, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "gpt-5-4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "unsloth/gemma-3-4b-it", + "name": "gemma 3 4b it", + "display_name": "gemma 3 4b it", "modalities": { "input": [ "text", @@ -90323,68 +98567,40 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 96000, + "output": 96000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.01, + "output": 0.0272, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "NousResearch/Hermes-4-14B", + "name": "Hermes 4 14B", + "display_name": "Hermes 4 14B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -90395,39 +98611,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - 
"unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-07-17", - "last_updated": "2025-07-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075 + "input": 0.0136, + "output": 0.0543, + "cache_read": 0.0068 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", + "name": "DeepHermes 3 Mistral 24B Preview", + "display_name": "DeepHermes 3 Mistral 24B Preview", "modalities": { "input": [ "text" @@ -90437,36 +98643,29 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.0245, + "output": 0.0978, + "cache_read": 0.01225 }, "type": "chat" }, { - "id": "gpt-5-5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "rednote-hilab/dots.ocr", + "name": "dots.ocr", + "display_name": "dots.ocr", "modalities": { "input": [ "text", @@ -90477,65 +98676,41 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - 
"default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.01, + "output": 0.0109, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "google/gemma-4-31B-turbo-TEE", + "name": "gemma 4 31B turbo TEE", + "display_name": "gemma 4 31B turbo TEE", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -90544,141 +98719,141 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.13, + "output": 0.38, + "cache_read": 0.065 }, "type": "chat" }, { - "id": "gpt-5-4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "XiaomiMiMo/MiMo-V2-Flash-TEE", + "name": "MiMo V2 Flash TEE", + "display_name": "MiMo V2 Flash TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, + "tool_call": true, 
+ "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", + "cost": { + "input": 0.09, + "output": 0.29, + "cache_read": 0.045 + }, + "type": "chat" + }, + { + "id": "MiniMaxAI/MiniMax-M2.5-TEE", + "name": "MiniMax M2.5 TEE", + "display_name": "MiniMax M2.5 TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 65536 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-04-25", "cost": { - "input": 0.75, - "output": 4.5, + "input": 0.15, + "output": 1.2, "cache_read": 0.075 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "Qwen/Qwen3.5-397B-A17B-TEE", + "name": "Qwen3.5 397B A17B TEE", + "display_name": "Qwen3.5 397B A17B TEE", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - 
"default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "open_weights": true, + "release_date": "2026-02-18", + "last_updated": "2026-04-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.39, + "output": 2.34, + "cache_read": 0.195 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek v4 Pro", - "display_name": "DeepSeek v4 Pro", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -90688,13 +98863,14 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -90707,22 +98883,21 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.14 + "input": 0.11, + "output": 0.6, + "cache_read": 0.055 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B 
Instruct", "modalities": { "input": [ "text" @@ -90732,69 +98907,61 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.07, - "output": 0.2 + "input": 0.1, + "output": 0.8, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen-3-6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", + "name": "Qwen3 235B A22B Instruct 2507 TEE", + "display_name": "Qwen3 235B A22B Instruct 2507 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-03", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.1 + "input": 0.1, + "output": 0.6, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "minimax-m2-7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "Qwen/Qwen3Guard-Gen-0.6B", + "name": "Qwen3Guard Gen 0.6B", + "display_name": "Qwen3Guard Gen 0.6B", "modalities": { "input": [ "text" @@ -90804,30 +98971,29 @@ ] }, "limit": { - "context": 192000, + "context": 32768, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": 
true, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.01, + "output": 0.0109, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "minimax-m2-5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -90837,30 +99003,41 @@ ] }, "limit": { - "context": 192000, - "output": 8192 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-01-15", - "last_updated": "2025-02-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.3, - "output": 1.2, + "input": 0.06, + "output": 0.22, "cache_read": 0.03 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ "text", @@ -90871,30 +99048,29 @@ ] }, "limit": { - "context": 128000, + "context": 16384, "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "open_weights": true, + "release_date": "2025-12-29", 
+ "last_updated": "2026-04-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.0543, + "output": 0.2174, + "cache_read": 0.02715 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "Qwen/Qwen3-32B-TEE", + "name": "Qwen3 32B TEE", + "display_name": "Qwen3 32B TEE", "modalities": { "input": [ "text" @@ -90904,8 +99080,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -90913,97 +99089,85 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.08, + "output": 0.24, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "gemini-3-1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "Qwen/Qwen3-Coder-Next-TEE", + "name": "Qwen3 Coder Next TEE", + "display_name": "Qwen3 Coder Next TEE", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-02-18", - "last_updated": "2026-02-18", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0.12, + "output": 0.75, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "kimi-k2-6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + 
"id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.0272, + "output": 0.1087, + "cache_read": 0.0136 }, "type": "chat" }, { - "id": "gpt-5-3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "Qwen/Qwen3.6-27B-TEE", + "name": "Qwen3.6 27B TEE", + "display_name": "Qwen3.6 27B TEE", "modalities": { "input": [ "text", @@ -91014,10 +99178,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -91026,97 +99190,61 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.195, + 
"output": 1.56, + "cache_read": 0.0975 }, "type": "chat" - } - ] - }, - "zhipuai-coding-plan": { - "id": "zhipuai-coding-plan", - "name": "Zhipu AI Coding Plan", - "display_name": "Zhipu AI Coding Plan", - "api": "https://open.bigmodel.cn/api/coding/paas/v4", - "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", - "models": [ + }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.2989, + "output": 1.1957, + "cache_read": 0.14945 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "tngtech/DeepSeek-TNG-R1T2-Chimera-TEE", + "name": "DeepSeek TNG R1T2 Chimera TEE", + "display_name": "DeepSeek TNG R1T2 Chimera TEE", "modalities": { "input": [ "text" @@ -91126,8 +99254,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -91135,33 +99263,30 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": 
true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 1.1, + "cache_read": 0.15 }, "type": "chat" - }, + } + ] + }, + "siliconflow": { + "id": "siliconflow", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.cn/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "Pro/deepseek-ai/DeepSeek-R1", + "name": "Pro/deepseek-ai/DeepSeek-R1", + "display_name": "Pro/deepseek-ai/DeepSeek-R1", "modalities": { "input": [ "text" @@ -91171,8 +99296,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -91193,20 +99318,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", "modalities": { "input": [ "text" @@ -91217,7 +99340,7 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -91226,22 +99349,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + 
"open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "Pro/deepseek-ai/DeepSeek-V3.2", + "name": "Pro/deepseek-ai/DeepSeek-V3.2", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -91251,8 +99371,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -91262,41 +99382,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.27, + "output": 0.42 }, "type": "chat" - } - ] - }, - "alibaba-coding-plan": { - "id": "alibaba-coding-plan", - "name": "Alibaba Coding Plan", - "display_name": "Alibaba Coding Plan", - "api": "https://coding-intl.dashscope.aliyuncs.com/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/coding-plan", - "models": [ + }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "Pro/deepseek-ai/DeepSeek-V3", + "name": "Pro/deepseek-ai/DeepSeek-V3", + "display_name": "Pro/deepseek-ai/DeepSeek-V3", "modalities": { "input": [ "text" @@ -91306,8 +99408,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -91315,35 +99417,30 @@ "supported": false }, "attachment": false, - 
"open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "Pro/moonshotai/Kimi-K2-Thinking", + "name": "Pro/moonshotai/Kimi-K2-Thinking", + "display_name": "Pro/moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -91362,34 +99459,32 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.55, + "output": 2.5 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "Pro/moonshotai/Kimi-K2.6", + "name": "Pro/moonshotai/Kimi-K2.6", + "display_name": "Pro/moonshotai/Kimi-K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -91410,32 +99505,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "glm-5", - "name": 
"GLM-5", - "display_name": "GLM-5", + "id": "Pro/moonshotai/Kimi-K2.5", + "name": "Pro/moonshotai/Kimi-K2.5", + "display_name": "Pro/moonshotai/Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -91455,21 +99549,50 @@ } }, "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0.45, + "output": 2.25 + }, + "type": "chat" + }, + { + "id": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "display_name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "Pro/zai-org/GLM-4.7", + "name": "Pro/zai-org/GLM-4.7", + "display_name": "Pro/zai-org/GLM-4.7", "modalities": { "input": [ "text" @@ -91479,8 +99602,8 @@ ] }, "limit": { - "context": 196608, - "output": 24576 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, @@ -91500,34 +99623,30 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.6, + "output": 2.2 }, 
"type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "Pro/zai-org/GLM-5", + "name": "Pro/zai-org/GLM-5", + "display_name": "Pro/zai-org/GLM-5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, @@ -91547,22 +99666,19 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "Pro/zai-org/GLM-5.1", + "name": "Pro/zai-org/GLM-5.1", + "display_name": "Pro/zai-org/GLM-5.1", "modalities": { "input": [ "text" @@ -91572,13 +99688,14 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -91592,22 +99709,20 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 1.4, + "output": 4.4, "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "Pro/MiniMaxAI/MiniMax-M2.1", + "name": "Pro/MiniMaxAI/MiniMax-M2.1", + "display_name": "Pro/MiniMaxAI/MiniMax-M2.1", "modalities": { "input": [ "text" @@ -91617,49 +99732,49 @@ ] }, 
"limit": { - "context": 262144, - "output": 65536 + "context": 197000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "Pro/MiniMaxAI/MiniMax-M2.5", + "name": "Pro/MiniMaxAI/MiniMax-M2.5", + "display_name": "Pro/MiniMaxAI/MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 192000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -91674,32 +99789,20 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 1.22 }, "type": "chat" - } - ] - }, - "venice": { - "id": "venice", - "name": "Venice AI", - "display_name": "Venice AI", - "doc": "https://docs.venice.ai", - "models": [ + }, { - "id": "openai-gpt-4o-mini-2024-07-18", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "deepseek-ai/DeepSeek-OCR", + "name": "deepseek-ai/DeepSeek-OCR", + "display_name": "deepseek-ai/DeepSeek-OCR", "modalities": { "input": [ - "text", "image" ], "output": [ @@ -91707,29 +99810,27 @@ ] }, "limit": { - "context": 128000, 
- "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-03-06", + "open_weights": true, + "release_date": "2025-10-20", + "last_updated": "2025-10-20", "cost": { - "input": 0.1875, - "output": 0.75, - "cache_read": 0.09375 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen3-next-80b", - "name": "Qwen 3 Next 80b", - "display_name": "Qwen 3 Next 80b", + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "modalities": { "input": [ "text" @@ -91739,68 +99840,59 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "release_date": "2024-12-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.35, - "output": 1.9 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "grok-4-20-multi-agent", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "display_name": "deepseek-ai/DeepSeek-V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-05-07", + "release_date": "2024-12-26", + 
"last_updated": "2025-11-25", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen 3 235B A22B Instruct 2507", - "display_name": "Qwen 3 235B A22B Instruct 2507", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "display_name": "deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -91810,41 +99902,45 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.15, - "output": 0.75 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": "z-ai-glm-5v-turbo", - "name": "GLM 5V Turbo", - "display_name": "GLM 5V Turbo", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -91852,65 +99948,63 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-12", + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 5, - "cache_read": 0.3 + "input": 0.1, + "output": 0.1 }, 
"type": "chat" }, { - "id": "gemma-4-uncensored", - "name": "Gemma 4 Uncensored", - "display_name": "Gemma 4 Uncensored", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-13", - "last_updated": "2026-04-19", + "attachment": false, + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 0.1625, - "output": 0.5 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "grok-41-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -91918,84 +100012,63 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-12-01", - "last_updated": "2026-04-09", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0.23, - "output": 0.57, - "cache_read": 0.06 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "display_name": "deepseek-ai/DeepSeek-R1", "modalities": { "input": [ - "text", - 
"image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-16", + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 3.6, - "output": 18, - "cache_read": 0.36, - "cache_write": 4.5 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "nvidia-nemotron-cascade-2-30b-a3b", - "name": "Nemotron Cascade 2 30B A3B", - "display_name": "Nemotron Cascade 2 30B A3B", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "display_name": "moonshotai/Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -92005,44 +100078,39 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-24", - "last_updated": "2026-04-09", + "open_weights": false, + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - "input": 0.14, - "output": 0.8 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": 
"Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "display_name": "moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -92051,17 +100119,8 @@ "default": true }, "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "reasoning": { + "supported": true, "interleaved": true, "summaries": true, "visibility": "summary", @@ -92070,22 +100129,20 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-19", - "last_updated": "2026-03-12", + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 0.7, - "output": 3.75, - "cache_read": 0.07 + "input": 0.55, + "output": 2.5 }, "type": "chat" }, { - "id": "grok-4-20", - "name": "Grok 4.20", - "display_name": "Grok 4.20", + "id": "zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "display_name": "zai-org/GLM-4.6V", "modalities": { "input": [ "text", @@ -92096,8 +100153,8 @@ ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -92107,117 +100164,85 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-05-07", + "release_date": "2025-12-07", + "last_updated": "2025-12-07", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "google-gemma-4-26b-a4b-it", - "name": 
"Google Gemma 4 26B A4B Instruct", - "display_name": "Google Gemma 4 26B A4B Instruct", + "id": "zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "display_name": "zai-org/GLM-4.6", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-12", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.1625, - "output": 0.5 + "input": 0.5, + "output": 1.9 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "display_name": "zai-org/GLM-4.5V", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct-turbo", - "name": "Qwen 3 Coder 480B Turbo", - "display_name": "Qwen 3 Coder 480B Turbo", + "id": "zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "display_name": "zai-org/GLM-4.5-Air", "modalities": { "input": [ "text" @@ -92227,8 +100252,8 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -92236,54 +100261,50 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-02-26", + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.35, - "output": 1.5, - "cache_read": 0.04 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "qwen3-5-397b-a17b", - "name": "Qwen 3.5 397B", - "display_name": "Qwen 3.5 397B", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.75, - "output": 4.5 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "zai-org-glm-4.7", - 
"name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", "modalities": { "input": [ "text" @@ -92293,76 +100314,59 @@ ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-24", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.55, - "output": 2.65, - "cache_read": 0.11 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "openai-gpt-54", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-09", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 3.13, - "output": 18.8, - "cache_read": 0.313 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "zai-org-glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", "modalities": { "input": [ 
"text" @@ -92372,29 +100376,28 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "nvidia-nemotron-3-nano-30b-a3b", - "name": "NVIDIA Nemotron 3 Nano 30B", - "display_name": "NVIDIA Nemotron 3 Nano 30B", + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", "modalities": { "input": [ "text" @@ -92404,8 +100407,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -92413,62 +100416,50 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3 VL 235B", - "display_name": "Qwen3 VL 235B", + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + 
"supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-01-16", - "last_updated": "2026-03-12", + "attachment": false, + "open_weights": false, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 1.5 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "openai-gpt-53-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "PaddlePaddle/PaddleOCR-VL", + "name": "PaddlePaddle/PaddleOCR-VL", + "display_name": "PaddlePaddle/PaddleOCR-VL", "modalities": { "input": [ "text", @@ -92479,30 +100470,28 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-12", + "open_weights": true, + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "venice-uncensored-1-2", - "name": "Venice Uncensored 1.2", - "display_name": "Venice Uncensored 1.2", + "id": "PaddlePaddle/PaddleOCR-VL-1.5", + "name": "PaddlePaddle/PaddleOCR-VL-1.5", + "display_name": "PaddlePaddle/PaddleOCR-VL-1.5", "modalities": { "input": [ "text", @@ -92513,28 +100502,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-19", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.2, - "output": 0.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai-gpt-52", - "name": "GPT-5.2", - 
"display_name": "GPT-5.2", + "id": "ascend-tribe/pangu-pro-moe", + "name": "ascend-tribe/pangu-pro-moe", + "display_name": "ascend-tribe/pangu-pro-moe", "modalities": { "input": [ "text" @@ -92544,31 +100533,28 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-13", - "last_updated": "2026-03-12", + "release_date": "2025-07-02", + "last_updated": "2026-01-16", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "mistral-small-3-2-24b-instruct", - "name": "Mistral Small 3.2 24B Instruct", - "display_name": "Mistral Small 3.2 24B Instruct", + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ "text" @@ -92578,28 +100564,33 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-15", - "last_updated": "2026-03-16", + "open_weights": false, + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.09375, - "output": 0.25 + "input": 0.21, + "output": 0.57 }, "type": "chat" }, { - "id": "minimax-m27", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "Kwaipilot/KAT-Dev", + "name": "Kwaipilot/KAT-Dev", + "display_name": "Kwaipilot/KAT-Dev", "modalities": { "input": [ "text" @@ -92609,30 +100600,28 @@ ] }, "limit": { - "context": 198000, - "output": 32768 + "context": 128000, + 
"output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-04-12", + "release_date": "2025-09-27", + "last_updated": "2026-01-16", "cost": { - "input": 0.375, - "output": 1.5, - "cache_read": 0.075 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen 3 235B A22B Thinking 2507", - "display_name": "Qwen 3 235B A22B Thinking 2507", + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", "modalities": { "input": [ "text" @@ -92642,54 +100631,39 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-07-02", + "last_updated": "2025-11-25", "cost": { - "input": 0.45, - "output": 3.5 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "qwen3-5-35b-a3b", - "name": "Qwen 3.5 35B A3B", - "display_name": "Qwen 3.5 35B A3B", + "id": "stepfun-ai/Step-3.5-Flash", + "name": "stepfun-ai/Step-3.5-Flash", + "display_name": "stepfun-ai/Step-3.5-Flash", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -92697,32 +100671,33 @@ "supported": true, "default": true }, - 
"attachment": true, - "open_weights": true, - "release_date": "2026-02-25", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.3125, - "output": 1.25, - "cache_read": 0.15625 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": "Qwen/Qwen3.5-9B", + "name": "Qwen/Qwen3.5-9B", + "display_name": "Qwen/Qwen3.5-9B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 50000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92730,65 +100705,91 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-20", - "last_updated": "2026-04-09", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.3125, - "output": 0.9375, - "cache_read": 0.03125 + "input": 0.22, + "output": 1.74 }, "type": "chat" }, { - "id": "google-gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "display_name": "Google Gemma 3 27B Instruct", + "id": "Qwen/Qwen3.5-4B", + "name": "Qwen/Qwen3.5-4B", + "display_name": "Qwen/Qwen3.5-4B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-04", - "last_updated": "2026-03-12", + "knowledge": "2025-04", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.12, - "output": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "olafangensan-glm-4.7-flash-heretic", - "name": "GLM 4.7 Flash Heretic", - "display_name": "GLM 4.7 Flash Heretic", + "id": "Qwen/Qwen3.5-122B-A10B", + "name": "Qwen/Qwen3.5-122B-A10B", + "display_name": "Qwen/Qwen3.5-122B-A10B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 24000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92796,32 +100797,45 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-02-04", - "last_updated": "2026-03-12", + "knowledge": "2025-04", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.14, - "output": 0.8 + "input": 0.29, + "output": 2.32 }, "type": "chat" }, { - "id": "openai-gpt-55-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen/Qwen3.5-397B-A17B", + "display_name": "Qwen/Qwen3.5-397B-A17B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92829,31 +100843,44 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-24", - 
"last_updated": "2026-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 37.5, - "output": 225 + "input": 0.29, + "output": 1.74 }, "type": "chat" }, { - "id": "openai-gpt-52-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "Qwen/Qwen3.5-27B", + "name": "Qwen/Qwen3.5-27B", + "display_name": "Qwen/Qwen3.5-27B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 262144, "output": 65536 }, "temperature": true, @@ -92862,65 +100889,91 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-01-15", - "last_updated": "2026-03-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-25", + "last_updated": "2026-02-25", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 0.26, + "output": 2.09 }, "type": "chat" }, { - "id": "venice-uncensored-role-play", - "name": "Venice Role Play Uncensored", - "display_name": "Venice Role Play Uncensored", + "id": "Qwen/Qwen3.5-35B-A3B", + "name": "Qwen/Qwen3.5-35B-A3B", + "display_name": "Qwen/Qwen3.5-35B-A3B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, 
+ "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2026-02-20", - "last_updated": "2026-03-16", + "knowledge": "2025-04", + "release_date": "2026-02-25", + "last_updated": "2026-02-25", "cost": { - "input": 0.5, - "output": 2 + "input": 0.23, + "output": 1.86 }, "type": "chat" }, { - "id": "zai-org-glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen/Qwen3.6-35B-A3B", + "display_name": "Qwen/Qwen3.6-35B-A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 32000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92941,30 +100994,31 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-03-12", + "knowledge": "2025-04", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.23, + "output": 1.86 }, "type": "chat" }, { - "id": "zai-org-glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "display_name": "Qwen/Qwen3-VL-32B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -92983,93 +101037,82 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-01", - "last_updated": "2026-04-04", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.85, - "output": 2.75, - 
"cache_read": 0.3 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-18", - "last_updated": "2026-05-04", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "mistral-small-2603", - "name": "Mistral Small 4", - "display_name": "Mistral Small 4", + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-04-09", + "attachment": false, + "open_weights": false, + "release_date": "2024-09-19", + "last_updated": "2025-11-25", "cost": { - "input": 0.1875, - "output": 0.75 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "openai-gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + 
"display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", "modalities": { "input": [ "text" @@ -93079,8 +101122,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -93088,21 +101131,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-06", - "last_updated": "2026-05-06", + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 0.07, + "input": 0.09, "output": 0.3 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "display_name": "Qwen/Qwen3-VL-8B-Thinking", "modalities": { "input": [ "text", @@ -93113,8 +101166,8 @@ ] }, "limit": { - "context": 198000, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -93124,58 +101177,90 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-06", - "last_updated": "2026-04-12", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 0.18, + "output": 2 }, "type": "chat" }, { - "id": "qwen3-5-9b", - "name": "Qwen 3.5 9B", - "display_name": "Qwen 3.5 9B", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", 
"modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", + "cost": { + "input": 0.25, + "output": 1 + } + }, + { + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-05", - "last_updated": "2026-04-19", + "open_weights": false, + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.15 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -93185,14 +101270,43 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-11-11", + "last_updated": "2025-11-25", + "cost": { + "input": 0.18, + "output": 0.18 + } + }, + { + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 
131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true }, "extra_capabilities": { "reasoning": { @@ -93206,57 +101320,50 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.17, - "output": 0.35, - "cache_read": 0.028 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "openai-gpt-54-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-09", - "cost": { - "input": 37.5, - "output": 225, - "context_over_200k": { - "input": 75, - "output": 337.5 - } + "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "openai-gpt-54-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "display_name": "Qwen/Qwen3-VL-8B-Instruct", "modalities": { "input": [ "text", @@ -93267,30 +101374,28 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": 
"2026-03-31", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.9375, - "output": 5.625, - "cache_read": 0.09375 + "input": 0.18, + "output": 0.68 }, "type": "chat" }, { - "id": "minimax-m25", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "modalities": { "input": [ "text" @@ -93300,41 +101405,28 @@ ] }, "limit": { - "context": 198000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-04-12", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.34, - "output": 1.19, - "cache_read": 0.04 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "zai-org-glm-5-1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", "modalities": { "input": [ "text" @@ -93344,53 +101436,39 @@ ] }, "limit": { - "context": 200000, - "output": 24000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-08", + "attachment": true, + 
"open_weights": false, + "release_date": "2025-03-24", + "last_updated": "2025-11-25", "cost": { - "input": 1.75, - "output": 5.5, - "cache_read": 0.325 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "openai-gpt-55", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -93398,122 +101476,105 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-25", + "release_date": "2025-10-11", + "last_updated": "2025-11-25", "cost": { - "input": 6.25, - "output": 37.5, - "cache_read": 0.625, - "context_over_200k": { - "input": 12.5, - "output": 56.25, - "cache_read": 1.25 - } + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "qwen3-6-27b", - "name": "Qwen 3.6 27B", - "display_name": "Qwen 3.6 27B", + "id": "Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "display_name": "Qwen/Qwen3-VL-32B-Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.325, - "output": 
3.25 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-16", + "release_date": "2025-03-06", + "last_updated": "2025-11-25", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 0.15, + "output": 0.58 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", "modalities": { "input": [ "text" @@ -93523,41 +101584,28 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.73, - "output": 3.796, - "cache_read": 0.33 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", "modalities": { "input": [ "text" @@ -93567,78 +101615,59 @@ ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false 
}, "attachment": false, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-04", - "last_updated": "2026-03-24", + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2025-11-25", "cost": { - "input": 0.33, - "output": 0.48, - "cache_read": 0.16 + "input": 0.09, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen-3-6-plus", - "name": "Qwen 3.6 Plus Uncensored", - "display_name": "Qwen 3.6 Plus Uncensored", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-12", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.625, - "output": 3.75, - "cache_read": 0.0625, - "cache_write": 0.78, - "context_over_200k": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.0625, - "cache_write": 0.78 - } + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "aion-labs-aion-2-0", - "name": "Aion 2.0", - "display_name": "Aion 2.0", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text" @@ -93648,102 +101677,90 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-24", - "last_updated": "2026-04-12", + "release_date": 
"2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 2, - "cache_read": 0.25 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-01-15", - "last_updated": "2026-04-12", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 3.75, - "output": 18.75, - "cache_read": 0.375, - "cache_write": 4.69 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "openai-gpt-4o-2024-11-20", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "display_name": "Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-03-06", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 3.125, - "output": 12.5 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "llama-3.3-70b", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": 
"Qwen/Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ "text" @@ -93753,8 +101770,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -93762,38 +101779,34 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-06", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-08-01", + "last_updated": "2025-11-25", "cost": { - "input": 0.7, - "output": 2.8 - }, - "type": "chat" + "input": 0.07, + "output": 0.28 + } }, { - "id": "kimi-k2-5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -93806,22 +101819,20 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2026-01-27", - "last_updated": "2026-04-30", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.56, - "output": 3.5, - "cache_read": 0.22 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - "id": "llama-3.2-3b", - "name": "Llama 3.2 3B", - "display_name": "Llama 3.2 3B", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ "text" @@ -93831,8 +101842,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -93840,20 +101851,19 @@ "supported": 
false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-10-03", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-07-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "arcee-trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", "modalities": { "input": [ "text" @@ -93863,14 +101873,13 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -93884,20 +101893,19 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-04", + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.3125, - "output": 1.125, - "cache_read": 0.075 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "hermes-3-llama-3.1-405b", - "name": "Hermes 3 Llama 3.1 405b", - "display_name": "Hermes 3 Llama 3.1 405b", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -93907,83 +101915,82 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": 
true, - "knowledge": "2024-04", + "open_weights": false, "release_date": "2025-09-25", - "last_updated": "2026-03-12", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 3 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "gemini-3-1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-03-12", + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.5, - "cache_write": 0.5, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "kimi-k2-6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -94003,82 +102010,62 @@ } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-30", + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.85, - "output": 4.655, - "cache_read": 0.22 + "input": 0.45, + "output": 
3.5 }, "type": "chat" }, { - "id": "claude-opus-4-6-fast", - "name": "Claude Opus 4.6 Fast", - "display_name": "Claude Opus 4.6 Fast", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 36, - "output": 180, - "cache_read": 3.6, - "cache_write": 45 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "z-ai-glm-5-turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", "modalities": { "input": [ "text" @@ -94088,8 +102075,8 @@ ] }, "limit": { - "context": 200000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -94097,63 +102084,62 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-15", - "last_updated": "2026-04-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "google-gemma-4-31b-it", - "name": "Google Gemma 4 31B Instruct", - "display_name": "Google Gemma 4 31B Instruct", + "id": "inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-03", - 
"last_updated": "2026-04-12", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", "cost": { - "input": 0.175, - "output": 0.5 + "input": 0.07, + "output": 0.28 }, "type": "chat" - } - ] - }, - "cerebras": { - "id": "cerebras", - "name": "Cerebras", - "display_name": "Cerebras", - "doc": "https://inference-docs.cerebras.ai/models/overview", - "models": [ + }, { - "id": "llama3.1-8b", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", "modalities": { "input": [ "text" @@ -94163,8 +102149,8 @@ ] }, "limit": { - "context": 32000, - "output": 8000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -94172,20 +102158,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "qwen-3-235b-a22b-instruct-2507", - "name": "Qwen 3 235B Instruct", - "display_name": "Qwen 3 235B Instruct", + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", "modalities": { "input": [ "text" @@ -94195,29 +102180,34 @@ ] }, "limit": { - "context": 131000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": 
"2025-11-25", "cost": { - "input": 0.6, - "output": 1.2 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "zai-glm-4.7", - "name": "Z.AI GLM-4.7", - "display_name": "Z.AI GLM-4.7", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -94228,29 +102218,18 @@ }, "limit": { "context": 131072, - "output": 40000 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-10", - "last_updated": "2026-01-10", - "cost": { - "input": 2.25, - "output": 2.75, - "cache_read": 0, - "cache_write": 0 - }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -94261,42 +102240,18 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.25, - "output": 0.69 + "supported": false }, "type": "chat" - } - ] - }, - "lmstudio": { - "id": "lmstudio", - "name": "LMStudio", - "display_name": "LMStudio", - "api": "http://127.0.0.1:1234/v1", - "doc": "https://lmstudio.ai/models", - "models": [ + }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "inclusionAI/Ring-1T", + "name": "inclusionAI/Ring-1T", + "display_name": "inclusionAI/Ring-1T", "modalities": { "input": [ "text" @@ -94307,9 +102262,8 @@ }, "limit": { "context": 131072, - "output": 32768 + 
"output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -94320,20 +102274,12 @@ "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b", - "name": "Qwen3 Coder 30B", - "display_name": "Qwen3 Coder 30B", + "id": "inclusionAI/Ling-1T", + "name": "inclusionAI/Ling-1T", + "display_name": "inclusionAI/Ling-1T", "modalities": { "input": [ "text" @@ -94343,29 +102289,107 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-2507", - "name": "Qwen3 30B A3B 2507", - "display_name": "Qwen3 30B A3B 2507", + "id": "Qwen/Qwen-Image-Edit-2509", + "name": "Qwen/Qwen-Image-Edit-2509", + "display_name": "Qwen/Qwen-Image-Edit-2509", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Qwen/Qwen-Image-Edit", + "name": "Qwen/Qwen-Image-Edit", + "display_name": "Qwen/Qwen-Image-Edit", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Qwen/Qwen-Image", + "name": "Qwen/Qwen-Image", + "display_name": "Qwen/Qwen-Image", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Wan-AI/Wan2.2-I2V-A14B", + "name": "Wan-AI/Wan2.2-I2V-A14B", + "display_name": "Wan-AI/Wan2.2-I2V-A14B", + "modalities": { 
+ "input": [ + "image", + "text" + ], + "output": [ + "video" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Wan-AI/Wan2.2-T2V-A14B", + "name": "Wan-AI/Wan2.2-T2V-A14B", + "display_name": "Wan-AI/Wan2.2-T2V-A14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "display_name": "zai-org/GLM-4.5", "modalities": { "input": [ "text" @@ -94375,38 +102399,19 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" - } - ] - }, - "lucidquery": { - "id": "lucidquery", - "name": "LucidQuery AI", - "display_name": "LucidQuery AI", - "api": "https://lucidquery.com/api/v1", - "doc": "https://lucidquery.com/api/docs", - "models": [ + }, { - "id": "lucidnova-rf1-100b", - "name": "LucidNova RF1 100B", - "display_name": "LucidNova RF1 100B", + "id": "stepfun-ai/step3", + "name": "stepfun-ai/step3", + "display_name": "stepfun-ai/step3", "modalities": { "input": [ "text" @@ -94416,30 +102421,36 @@ ] }, "limit": { - "context": 120000, - "output": 8000 + "context": 131072, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-16", - "release_date": "2024-12-28", - "last_updated": "2025-09-10", - "cost": { - "input": 2, - "output": 5 + "supported": false }, "type": "chat" }, { - "id": "lucidquery-nexus-coder", - "name": "LucidQuery Nexus Coder", - "display_name": "LucidQuery Nexus Coder", + "id": "TeleAI/TeleSpeechASR", + "name": 
"TeleAI/TeleSpeechASR", + "display_name": "TeleAI/TeleSpeechASR", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "THUDM/GLM-4.1V-9B-Thinking", + "name": "THUDM/GLM-4.1V-9B-Thinking", + "display_name": "THUDM/GLM-4.1V-9B-Thinking", "modalities": { "input": [ "text" @@ -94449,39 +102460,20 @@ ] }, "limit": { - "context": 250000, - "output": 60000 + "context": 131072, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", - "cost": { - "input": 2, - "output": 5 - }, "type": "chat" - } - ] - }, - "moonshot": { - "id": "moonshot", - "name": "Moonshot AI (China)", - "display_name": "Moonshot AI (China)", - "api": "https://api.moonshot.cn/v1", - "doc": "https://platform.moonshot.cn/docs/api/chat", - "models": [ + }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", "modalities": { "input": [ "text" @@ -94491,42 +102483,20 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", - "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, "type": "chat" }, { - "id": "kimi-k2-0711-preview", - "name": "Kimi K2 0711", - 
"display_name": "Kimi K2 0711", + "id": "moonshotai/Kimi-Dev-72B", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", "modalities": { "input": [ "text" @@ -94537,29 +102507,18 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", - "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMaxAI/MiniMax-M1-80k", + "display_name": "MiniMaxAI/MiniMax-M1-80k", "modalities": { "input": [ "text" @@ -94569,77 +102528,42 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 2.4, - "output": 10, - "cache_read": 0.6 - }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "Tongyi-Zhiwen/QwenLong-L1-32B", + "name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "display_name": "Tongyi-Zhiwen/QwenLong-L1-32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - 
"knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 - }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "display_name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", "modalities": { "input": [ "text" @@ -94649,61 +102573,35 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", - "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 - }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen/Qwen3-30B-A3B", + "display_name": "Qwen/Qwen3-30B-A3B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -94716,340 +102614,199 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", - "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 - }, "type": "chat" }, { - "id": "kimi-k2-0905-preview", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": 
"Qwen/Qwen3-Reranker-8B", + "name": "Qwen/Qwen3-Reranker-8B", + "display_name": "Qwen/Qwen3-Reranker-8B", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" - } - ] - }, - "azure-cognitive-services": { - "id": "azure-cognitive-services", - "name": "Azure Cognitive Services", - "display_name": "Azure Cognitive Services", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ + "type": "rerank" + }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen/Qwen3-Embedding-8B", + "display_name": "Qwen/Qwen3-Embedding-8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "supported": false }, - "type": "chat" + "type": "embedding" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "Qwen/Qwen3-Reranker-4B", + "name": "Qwen/Qwen3-Reranker-4B", + "display_name": "Qwen/Qwen3-Reranker-4B", 
"modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "supported": false }, - "type": "chat" + "type": "rerank" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "Qwen/Qwen3-Embedding-4B", + "name": "Qwen/Qwen3-Embedding-4B", + "display_name": "Qwen/Qwen3-Embedding-4B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "supported": false }, - "type": "chat" + "type": "embedding" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "Qwen/Qwen3-Reranker-0.6B", + "name": "Qwen/Qwen3-Reranker-0.6B", + "display_name": "Qwen/Qwen3-Reranker-0.6B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": 
true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "type": "rerank" + }, + { + "id": "Qwen/Qwen3-Embedding-0.6B", + "name": "Qwen/Qwen3-Embedding-0.6B", + "display_name": "Qwen/Qwen3-Embedding-0.6B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "embedding" + ] }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", - "cost": { - "input": 0.95, - "output": 4 + "limit": { + "context": 8192, + "output": 2048 }, - "type": "chat" + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "display_name": "Qwen/Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } - }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "supported": false }, "type": "chat" }, { - "id": "mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "modalities": { "input": [ "text" @@ -95059,63 +102816,43 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 1.35, - "output": 5.4 - }, "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 
Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "Qwen/QVQ-72B-Preview", + "name": "Qwen/QVQ-72B-Preview", + "display_name": "Qwen/QVQ-72B-Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.25, - "output": 1 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "deepseek-ai/DeepSeek-V2.5", + "name": "deepseek-ai/DeepSeek-V2.5", + "display_name": "deepseek-ai/DeepSeek-V2.5", "modalities": { "input": [ "text" @@ -95125,88 +102862,87 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.3, - "output": 0.9 - }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "fnlp/MOSS-TTSD-v0.5", + "name": "fnlp/MOSS-TTSD-v0.5", + "display_name": "fnlp/MOSS-TTSD-v0.5", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", "audio" ] }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": false + } + }, + { + "id": "FunAudioLLM/CosyVoice2-0.5B", + "name": "FunAudioLLM/CosyVoice2-0.5B", + "display_name": "FunAudioLLM/CosyVoice2-0.5B", + 
"modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "FunAudioLLM/SenseVoiceSmall", + "name": "FunAudioLLM/SenseVoiceSmall", + "display_name": "FunAudioLLM/SenseVoiceSmall", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "IndexTeam/IndexTTS-2", + "name": "IndexTeam/IndexTTS-2", + "display_name": "IndexTeam/IndexTTS-2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] }, - "type": "chat" + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "BAAI/bge-m3", + "name": "BAAI/bge-m3", + "display_name": "BAAI/bge-m3", "modalities": { "input": [ "text" @@ -95216,151 +102952,123 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", - "cost": { - 
"input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "supported": false }, - "type": "chat" + "type": "embedding" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "BAAI/bge-reranker-v2-m3", + "name": "BAAI/bge-reranker-v2-m3", + "display_name": "BAAI/bge-reranker-v2-m3", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 1.35, - "output": 5.4 + "supported": false }, - "type": "chat" + "type": "rerank" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "netease-youdao/bce-embedding-base_v1", + "name": "netease-youdao/bce-embedding-base_v1", + "display_name": "netease-youdao/bce-embedding-base_v1", "modalities": { "input": [ "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 8192, + "output": 2048 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", - "cost": { - "input": 1.5, - "output": 2 + "type": "embedding" + }, + { + "id": "netease-youdao/bce-reranker-base_v1", + "name": "netease-youdao/bce-reranker-base_v1", + "display_name": "netease-youdao/bce-reranker-base_v1", + "modalities": { + "input": [ + "text" + ], + "output": [ + 
"score" + ] }, - "type": "chat" + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "Kwai-Kolors/Kolors", + "name": "Kwai-Kolors/Kolors", + "display_name": "Kwai-Kolors/Kolors", "modalities": { "input": [ - "text", + "text" + ], + "output": [ "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Qwen/Qwen2-VL-72B-Instruct", + "name": "Qwen/Qwen2-VL-72B-Instruct", + "display_name": "Qwen/Qwen2-VL-72B-Instruct", + "modalities": { + "input": [ + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", - "cost": { - "input": 0.4, - "output": 2 - }, "type": "chat" }, { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", + "id": "Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-7B-Instruct", "modalities": { "input": [ "text" @@ -95370,30 +103078,18 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.125, - "output": 0.5 - }, - "type": "chat" + "supported": false + } }, { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", + "id": "internlm/internlm2_5-7b-chat", + "name": 
"internlm/internlm2_5-7b-chat", + "display_name": "internlm/internlm2_5-7b-chat", "modalities": { "input": [ "text" @@ -95403,28 +103099,19 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", - "cost": { - "input": 0.1, - "output": 0 - }, "type": "chat" }, { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", + "id": "Qwen/Qwen2-7B-Instruct", + "name": "Qwen/Qwen2-7B-Instruct", + "display_name": "Qwen/Qwen2-7B-Instruct", "modalities": { "input": [ "text" @@ -95434,85 +103121,41 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", - "cost": { - "input": 60, - "output": 120 - }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "THUDM/glm-4-9b-chat", + "name": "THUDM/glm-4-9b-chat", + "display_name": "THUDM/glm-4-9b-chat", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - 
"release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "supported": false }, "type": "chat" }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "BAAI/bge-large-en-v1.5", + "name": "BAAI/bge-large-en-v1.5", + "display_name": "BAAI/bge-large-en-v1.5", "modalities": { "input": [ "text" @@ -95522,29 +103165,19 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.125, - "output": 0.5 - }, - "type": "chat" + "type": "embedding" }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "BAAI/bge-large-zh-v1.5", + "name": "BAAI/bge-large-zh-v1.5", + "display_name": "BAAI/bge-large-zh-v1.5", "modalities": { "input": [ "text" @@ -95554,29 +103187,19 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", - "cost": { - "input": 3, - "output": 4 - }, - "type": "chat" + "type": "embedding" }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ "text" @@ -95586,29 +103209,19 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": true, - 
"tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", - "cost": { - "input": 0.17, - "output": 0.68 - }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ "text" @@ -95618,35 +103231,19 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0.58, - "output": 1.68 + "supported": false }, "type": "chat" }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", + "id": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "modalities": { "input": [ "text" @@ -95656,29 +103253,20 @@ ] }, "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "context": 131072, + "output": 8192 }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", - "cost": { - "input": 0.15, - "output": 0.6 + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 
0301", + "id": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", "modalities": { "input": [ "text" @@ -95688,29 +103276,18 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", - "cost": { - "input": 1.5, - "output": 2 - }, - "type": "chat" + } }, { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "Pro/BAAI/bge-m3", + "name": "Pro/BAAI/bge-m3", + "display_name": "Pro/BAAI/bge-m3", "modalities": { "input": [ "text" @@ -95720,117 +103297,63 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" + "type": "embedding" }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "Pro/Qwen/Qwen2.5-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - 
"verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "supported": false }, "type": "chat" }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "Pro/BAAI/bge-reranker-v2-m3", + "name": "Pro/BAAI/bge-reranker-v2-m3", + "display_name": "Pro/BAAI/bge-reranker-v2-m3", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { "context": 8192, "output": 2048 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0.3, - "output": 0.61 - }, - "type": "chat" + "type": "rerank" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ "text" @@ -95840,29 +103363,19 @@ ] }, "limit": { - "context": 8192, + "context": 131072, "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", - "cost": { - "input": 60, - "output": 120 - }, "type": "chat" }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "Pro/Qwen/Qwen2-7B-Instruct", + "name": "Pro/Qwen/Qwen2-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2-7B-Instruct", "modalities": { "input": [ "text" @@ -95872,30 +103385,19 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + 
"context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.075, - "output": 0.3 + "supported": false }, "type": "chat" }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ "text" @@ -95905,29 +103407,19 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 2.68, - "output": 3.54 - }, "type": "chat" }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", + "id": "Pro/THUDM/glm-4-9b-chat", + "name": "Pro/THUDM/glm-4-9b-chat", + "display_name": "Pro/THUDM/glm-4-9b-chat", "modalities": { "input": [ "text" @@ -95937,29 +103429,19 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", - "cost": { - "input": 0.13, - "output": 0.52 - }, "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "THUDM/GLM-Z1-Rumination-32B-0414", + "name": "THUDM/GLM-Z1-Rumination-32B-0414", + "display_name": 
"THUDM/GLM-Z1-Rumination-32B-0414", "modalities": { "input": [ "text" @@ -95970,169 +103452,233 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", - "cost": { - "input": 0.56, - "output": 1.68 - }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "stabilityai/stable-diffusion-xl-base-1.0", + "name": "stabilityai/stable-diffusion-xl-base-1.0", + "display_name": "stabilityai/stable-diffusion-xl-base-1.0", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 8191, - "output": 1536 - }, "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "cost": { - "input": 0.02, - "output": 0 - }, - "type": "embedding" + } }, { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", + "id": "black-forest-labs/FLUX.1-schnell", + "name": "black-forest-labs/FLUX.1-schnell", + "display_name": "black-forest-labs/FLUX.1-schnell", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 16384, - "output": 16384 - }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false + } + }, + { + "id": "black-forest-labs/FLUX.1-dev", + "name": "black-forest-labs/FLUX.1-dev", + "display_name": "black-forest-labs/FLUX.1-dev", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", - "cost": { - "input": 1, - "output": 2 - }, - "type": 
"chat" + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "Pro/black-forest-labs/FLUX.1-schnell", + "name": "Pro/black-forest-labs/FLUX.1-schnell", + "display_name": "Pro/black-forest-labs/FLUX.1-schnell", "modalities": { "input": [ - "text", + "text" + ], + "output": [ "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "stabilityai/stable-diffusion-3-5-large", + "name": "stabilityai/stable-diffusion-3-5-large", + "display_name": "stabilityai/stable-diffusion-3-5-large", + "modalities": { + "input": [ + "text" ], "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "fishaudio/fish-speech-1.4", + "name": "fishaudio/fish-speech-1.4", + "display_name": "fishaudio/fish-speech-1.4", + "modalities": { + "input": [ "text" + ], + "output": [ + "audio" ] }, - "limit": { - "context": 128000, - "output": 16384 + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "RVC-Boss/GPT-SoVITS", + "name": "RVC-Boss/GPT-SoVITS", + "display_name": "RVC-Boss/GPT-SoVITS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false + } + }, + { + "id": "fishaudio/fish-speech-1.5", + "name": "fishaudio/fish-speech-1.5", + "display_name": "fishaudio/fish-speech-1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", - "cost": { - "input": 0.14, - "output": 0 + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "black-forest-labs/FLUX.1-pro", + "name": "black-forest-labs/FLUX.1-pro", + "display_name": "black-forest-labs/FLUX.1-pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + 
] }, - "type": "chat" + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "LoRA/black-forest-labs/FLUX.1-dev", + "name": "LoRA/black-forest-labs/FLUX.1-dev", + "display_name": "LoRA/black-forest-labs/FLUX.1-dev", "modalities": { "input": [ - "text", + "text" + ], + "output": [ "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "SeedLLM/Seed-Rice-7B", + "name": "SeedLLM/Seed-Rice-7B", + "display_name": "SeedLLM/Seed-Rice-7B", + "modalities": { + "input": [ + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", - "cost": { - "input": 0.1, - "output": 0.3 - }, "type": "chat" - }, + } + ] + }, + "nvidia": { + "id": "nvidia", + "name": "Nvidia", + "display_name": "Nvidia", + "api": "https://integrate.api.nvidia.com/v1", + "doc": "https://docs.api.nvidia.com/nim/", + "models": [ { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "deepseek-ai/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163840, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -96140,46 +103686,35 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": 
"2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "deepseek-ai/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -96187,86 +103722,57 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-01", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "bytedance/seed-oss-36b-instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", 
- "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "moonshotai/kimi-k2-instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -96276,28 +103782,29 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, + "input": 0, "output": 0 }, "type": "chat" }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -96308,44 +103815,29 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - 
"release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2024-01", + "release_date": "2025-01-01", + "last_updated": "2025-09-05", "cost": { - "input": 16.5, - "output": 66, - "cache_read": 8.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -96355,131 +103847,145 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - 
"effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "z-ai/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 1536 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.12, + "input": 0, "output": 0 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "z-ai/glm4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": 
false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -96488,111 +103994,98 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 10, - "output": 30 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "openai/whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": 
{ "input": [ - "text", - "image", "audio" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": false, + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ "text" @@ -96603,221 +104096,163 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", "cost": { - "input": 5.33, - "output": 16 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "black-forest-labs/flux_1-kontext-dev", + "name": "FLUX.1-Kontext-dev", + "display_name": "FLUX.1-Kontext-dev", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] 
}, "limit": { - "context": 128000, - "output": 8192 + "context": 40960, + "output": 40960 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.37, - "output": 0.37 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "black-forest-labs/flux_1-schnell", + "name": "FLUX.1-schnell", + "display_name": "FLUX.1-schnell", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 77, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2024-07", + "release_date": "2024-08-01", + "last_updated": "2026-02-04", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "black-forest-labs/flux.1-dev", + "name": "FLUX.1-dev", + "display_name": "FLUX.1-dev", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 4096, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 2, - "output": 6 - }, - "type": 
"chat" - }, - { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-01", + "last_updated": "2025-09-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "display_name": "DeepSeek-V3.2-Speciale", + "id": "black-forest-labs/flux_2-klein-4b", + "name": "FLUX.2 Klein 4B", + "display_name": "FLUX.2 Klein 4B", "modalities": { "input": [ + "image", "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2025-06", + "release_date": "2026-01-14", + "last_updated": "2026-01-31", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - 
"display_name": "DeepSeek-R1", + "id": "nvidia/usdvalidate", + "name": "usdvalidate", + "display_name": "usdvalidate", "modalities": { "input": [ "text" @@ -96827,74 +104262,60 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2024-07-24", + "last_updated": "2025-01-08", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "nvidia/magpie-tts-zeroshot", + "name": "magpie-tts-zeroshot", + "display_name": "magpie-tts-zeroshot", "modalities": { "input": [ "text", - "image" + "audio" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2025-05-22", + "last_updated": "2025-06-12", "cost": { - "input": 2.04, - "output": 2.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "nvidia/gliner-pii", + "name": "gliner-pii", + "display_name": "gliner-pii", "modalities": { "input": [ "text" @@ -96904,115 
+104325,90 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "open_weights": true, + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.1, + "input": 0, "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "nvidia/active-speaker-detection", + "name": "Active Speaker Detection", + "display_name": "Active Speaker Detection", "modalities": { "input": [ - "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "nvidia/sparsedrive", + "name": "sparsedrive", + "display_name": "sparsedrive", "modalities": { "input": [ - "text" + "video" ], "output": [ "text" ] }, "limit": { - 
"context": 8192, - "output": 2048 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2025-03-18", + "last_updated": "2025-07-20", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "nvidia/nemotron-content-safety-reasoning-4b", + "name": "nemotron-content-safety-reasoning-4b", + "display_name": "nemotron-content-safety-reasoning-4b", "modalities": { "input": [ "text" @@ -97022,141 +104418,93 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "nvidia/nv-embed-v1", + "name": "nv-embed-v1", + "display_name": "nv-embed-v1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 32768, + "output": 2048 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", 
- "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2024-06-07", + "last_updated": "2025-07-22", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "nvidia/cosmos-transfer1-7b", + "name": "cosmos-transfer1-7b", + "display_name": "cosmos-transfer1-7b", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-06-13", + "last_updated": "2025-06-30", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "nvidia/nv-embedcode-7b-v1", + "name": "nv-embedcode-7b-v1", + "display_name": "nv-embedcode-7b-v1", "modalities": { "input": [ "text" @@ -97166,30 +104514,28 @@ ] }, "limit": { - 
"context": 32000, - "output": 4096 + "context": 32768, + "output": 2048 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-03-17", + "last_updated": "2025-05-29", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "nvidia/nvidia-nemotron-nano-9b-v2", + "name": "nvidia-nemotron-nano-9b-v2", + "display_name": "nvidia-nemotron-nano-9b-v2", "modalities": { "input": [ "text" @@ -97199,117 +104545,108 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-09", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "nvidia/cosmos-predict1-5b", + "name": "cosmos-predict1-5b", + "display_name": "cosmos-predict1-5b", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 8192, + "output": 4096 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + 
"attachment": true, + "open_weights": true, + "release_date": "2025-03-18", + "last_updated": "2025-03-18", "cost": { - "input": 0.13, + "input": 0, "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning", + "name": "Nemotron 3 Nano Omni", + "display_name": "Nemotron 3 Nano Omni", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 256000, "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-28", + "last_updated": "2026-04-28", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "nvidia/synthetic-video-detector", + "name": "synthetic-video-detector", + "display_name": "synthetic-video-detector", "modalities": { "input": [ - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 4096 }, "temperature": true, @@ -97317,56 +104654,53 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 
0.16, - "output": 0.64 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super", + "display_name": "Nemotron 3 Super", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "nvidia/studiovoice", + "name": "studiovoice", + "display_name": "studiovoice", "modalities": { "input": [ "text" @@ -97376,29 +104710,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2024-10-03", + "last_updated": "2025-06-13", "cost": { - "input": 1.14, - "output": 4.56 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "nvidia/rerank-qa-mistral-4b", + "name": "rerank-qa-mistral-4b", + "display_name": "rerank-qa-mistral-4b", "modalities": { "input": [ "text" @@ -97409,73 
+104742,58 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-03-17", + "last_updated": "2025-01-17", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "nvidia/llama-3_1-nemotron-safety-guard-8b-v3", + "name": "llama-3.1-nemotron-safety-guard-8b-v3", + "display_name": "llama-3.1-nemotron-safety-guard-8b-v3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 0.6, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "nvidia/llama-3_3-nemotron-super-49b-v1_5", + "name": "Llama 3.3 Nemotron Super 49B v1.5", + "display_name": "Llama 3.3 Nemotron Super 49B v1.5", "modalities": { "input": [ "text" @@ -97485,32 +104803,33 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 
}, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "nvidia/streampetr", + "name": "streampetr", + "display_name": "streampetr", "modalities": { "input": [ - "text" + "video" ], "output": [ "text" @@ -97521,25 +104840,57 @@ "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "nvidia/cosmos-transfer2_5-2b", + "name": "cosmos-transfer2.5-2b", + "display_name": "cosmos-transfer2.5-2b", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "video" + ] + }, + "limit": { + "context": 8192, + "output": 4096 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "nvidia/usdcode", + "name": "usdcode", + "display_name": "usdcode", "modalities": { "input": [ "text" @@ -97549,8 +104900,8 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 128000, + "output": 4096 
}, "temperature": true, "tool_call": false, @@ -97558,24 +104909,23 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "nvidia/nemotron-voicechat", + "name": "nemotron-voicechat", + "display_name": "nemotron-voicechat", "modalities": { "input": [ "text", - "image" + "audio" ], "output": [ "text" @@ -97592,19 +104942,18 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.2, - "output": 0.78 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "nvidia/llama-3_2-nemoretriever-300m-embed-v1", + "name": "llama-3_2-nemoretriever-300m-embed-v1", + "display_name": "llama-3_2-nemoretriever-300m-embed-v1", "modalities": { "input": [ "text" @@ -97614,34 +104963,32 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 2048 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2025-07-24", + "last_updated": "2025-07-24", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": 
"nvidia/llama-nemotron-rerank-vl-1b-v2", + "name": "llama-nemotron-rerank-vl-1b-v2", + "display_name": "llama-nemotron-rerank-vl-1b-v2", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" @@ -97651,96 +104998,89 @@ "context": 128000, "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2026-03-31", + "last_updated": "2026-03-31", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "nvidia/bevformer", + "name": "bevformer", + "display_name": "bevformer", "modalities": { "input": [ - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "open_weights": true, + "release_date": "2025-03-18", + "last_updated": "2025-07-20", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "nvidia/llama-3_3-nemotron-super-49b-v1", + "name": "Llama 3.3 Nemotron Super 49B v1", + "display_name": "Llama 3.3 Nemotron Super 49B v1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, 
"tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-07", + "last_updated": "2025-04-07", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "nvidia/riva-translate-4b-instruct-v1_1", + "name": "riva-translate-4b-instruct-v1_1", + "display_name": "riva-translate-4b-instruct-v1_1", "modalities": { "input": [ "text" @@ -97751,299 +105091,185 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "nvidia/nemotron-3-content-safety", + "name": "nemotron-3-content-safety", + "display_name": "nemotron-3-content-safety", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": 
"medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "nvidia/llama-nemotron-embed-vl-1b-v2", + "name": "llama-nemotron-embed-vl-1b-v2", + "display_name": "llama-nemotron-embed-vl-1b-v2", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 2048 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "open_weights": true, + "release_date": "2026-02-10", + "last_updated": "2026-02-10", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "nemotron-3-nano-30b-a3b", + "display_name": "nemotron-3-nano-30b-a3b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] 
}, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "nvidia/nemotron-mini-4b-instruct", + "name": "nemotron-mini-4b-instruct", + "display_name": "nemotron-mini-4b-instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false + "context": 128000, + "output": 8192 }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + 
"attachment": false, + "open_weights": true, + "release_date": "2024-08-21", + "last_updated": "2024-08-26", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "mistralai/mixtral-8x7b-instruct", + "name": "Mistral: Mixtral 8x7B Instruct", + "display_name": "Mistral: Mixtral 8x7B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "attachment": false, + "open_weights": true, + "release_date": "2023-12-10", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "mistralai/mistral-7b-instruct-v03", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ "text" @@ -98053,8 +105279,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -98062,55 +105288,50 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": 
"GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "mistralai/mistral-small-4-119b-2603", + "name": "mistral-small-4-119b-2603", + "display_name": "mistral-small-4-119b-2603", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675B Instruct 2512", + "display_name": "Mistral Large 3 675B Instruct 2512", "modalities": { "input": [ "text", @@ -98121,8 +105342,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -98130,21 +105351,20 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "mistralai/mixtral-8x22b-instruct", + "name": "Mistral: Mixtral 8x22B Instruct", + "display_name": "Mistral: Mixtral 8x22B Instruct", "modalities": { "input": [ "text" @@ -98154,8 +105374,8 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 
65536, + "output": 13108 }, "temperature": true, "tool_call": true, @@ -98164,53 +105384,48 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "mistralai/magistral-small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "mistralai/mistral-medium-3-instruct", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", @@ -98221,94 +105436,60 @@ ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 131072, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": 
"2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 15, - "output": 120 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "mistralai/devstral-2-123b-instruct-2512", + "name": "Devstral-2-123B-Instruct-2512", + "display_name": "Devstral-2-123B-Instruct-2512", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-09", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "mistralai/mistral-nemotron", + "name": "mistral-nemotron", + "display_name": "mistral-nemotron", "modalities": { "input": [ "text" @@ -98318,77 +105499,86 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "release_date": "2025-06-11", + "last_updated": "2025-06-12", "cost": { - "input": 
0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -98398,26 +105588,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "attachment": true, + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-02-16", 
+ "last_updated": "2026-02-16", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -98427,10 +105621,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -98439,33 +105633,61 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "qwen/qwen-image-edit", + "name": "Qwen Image Edit", + "display_name": "Qwen Image Edit", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", + "cost": { + "input": 0, + "output": 0 + }, + "type": "imageGeneration" + }, + { + "id": 
"qwen/qwen2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32b Instruct", + "display_name": "Qwen2.5 Coder 32b Instruct", "modalities": { "input": [ "text" @@ -98475,85 +105697,60 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": true, + "release_date": "2024-11-06", + "last_updated": "2024-11-06", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 66536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-command-r-08-2024", - "name": "Command R", - 
"display_name": "Command R", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -98563,8 +105760,8 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -98572,54 +105769,52 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "qwen/qwen-image", + "name": "Qwen Image", + "display_name": "Qwen Image", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "google/gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "display_name": "Gemma-3-27B-IT", "modalities": { "input": [ "text", @@ -98630,100 +105825,65 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, 
"attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 10, - "output": 30 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "google/gemma-4-31b-it", + "name": "Gemma-4-31B-IT", + "display_name": "Gemma-4-31B-IT", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 256000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "abliteration-ai": { - "id": "abliteration-ai", - "name": "abliteration.ai", - "display_name": "abliteration.ai", - "api": "https://api.abliteration.ai/v1", - "doc": "https://docs.abliteration.ai/models", - "models": [ + }, { - "id": "abliterated-model", - "name": "Abliterated Model", - "display_name": "Abliterated Model", + "id": "google/gemma-3n-e2b-it", + "name": "Gemma 3n E2b It", + "display_name": "Gemma 3n E2b It", "modalities": { 
"input": [ "text", @@ -98734,8 +105894,8 @@ ] }, "limit": { - "context": 150000, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -98744,59 +105904,52 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-01-06", - "last_updated": "2026-01-06", + "knowledge": "2024-06", + "release_date": "2025-06-12", + "last_updated": "2025-06-12", "cost": { - "input": 3, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "cohere": { - "id": "cohere", - "name": "Cohere", - "display_name": "Cohere", - "doc": "https://docs.cohere.com/docs/models", - "models": [ + }, { - "id": "command-a-reasoning-08-2025", - "name": "Command A Reasoning", - "display_name": "Command A Reasoning", + "id": "google/gemma-3n-e4b-it", + "name": "Gemma 3n E4b It", + "display_name": "Gemma 3n E4b It", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2024-06", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "command-r7b-12-2024", - "name": "Command R7B", - "display_name": "Command R7B", + "id": "google/gemma-2-2b-it", + "name": "Gemma 2 2b It", + "display_name": "Gemma 2 2b It", "modalities": { "input": [ "text" @@ -98807,7 +105960,7 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -98816,19 +105969,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-02-27", - 
"last_updated": "2024-02-27", + "release_date": "2024-07-16", + "last_updated": "2024-07-16", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "c4ai-aya-vision-8b", - "name": "Aya Vision 8B", - "display_name": "Aya Vision 8B", + "id": "google/google-paligemma", + "name": "paligemma", + "display_name": "paligemma", "modalities": { "input": [ "text", @@ -98839,8 +105991,8 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": false, @@ -98849,46 +106001,53 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-03-04", - "last_updated": "2025-05-14", + "release_date": "2024-05-14", + "last_updated": "2024-08-26", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-Mini", + "display_name": "Phi-4-Mini", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "c4ai-aya-expanse-8b", - "name": "Aya Expanse 8B", - "display_name": "Aya Expanse 8B", + "id": "microsoft/phi-4-multimodal-instruct", + "name": "Phi 4 Multimodal", + "display_name": "Phi 4 Multimodal", "modalities": { "input": [ "text" @@ -98898,24 +106057,27 @@ ] }, "limit": { - "context": 8000, - 
"output": 4000 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-10-24", - "last_updated": "2024-10-24", + "open_weights": false, + "release_date": "2025-07-26", + "last_updated": "2025-07-26", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "command-r7b-arabic-02-2025", - "name": "Command R7B Arabic", - "display_name": "Command R7B Arabic", + "id": "upstage/solar-10_7b-instruct", + "name": "solar-10.7b-instruct", + "display_name": "solar-10.7b-instruct", "modalities": { "input": [ "text" @@ -98926,7 +106088,7 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -98935,80 +106097,99 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2024-06-05", + "last_updated": "2025-04-10", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "command-a-vision-07-2025", - "name": "Command A Vision", - "display_name": "Command A Vision", + "id": "minimaxai/minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "knowledge": "2025-08", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + 
"output": 0 }, "type": "chat" }, { - "id": "c4ai-aya-vision-32b", - "name": "Aya Vision 32B", - "display_name": "Aya Vision 32B", + "id": "minimaxai/minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-03-04", - "last_updated": "2025-05-14", + "release_date": "2026-03-18", + "last_updated": "2026-04-11", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "command-a-translate-08-2025", - "name": "Command A Translate", - "display_name": "Command A Translate", + "id": "sarvamai/sarvam-m", + "name": "sarvam-m", + "display_name": "sarvam-m", "modalities": { "input": [ "text" @@ -99018,8 +106199,8 @@ ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -99028,19 +106209,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "abacusai/dracarys-llama-3_1-70b-instruct", + "name": "dracarys-llama-3.1-70b-instruct", + "display_name": "dracarys-llama-3.1-70b-instruct", "modalities": { "input": [ "text" @@ -99051,7 +106231,7 @@ }, "limit": 
{ "context": 128000, - "output": 4000 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -99060,19 +106240,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-09-11", + "last_updated": "2025-05-22", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "c4ai-aya-expanse-32b", - "name": "Aya Expanse 32B", - "display_name": "Aya Expanse 32B", + "id": "baai/bge-m3", + "name": "BGE M3", + "display_name": "BGE M3", "modalities": { "input": [ "text" @@ -99082,24 +106261,28 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 8192, + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-10-24", - "last_updated": "2024-10-24", - "type": "chat" + "release_date": "2024-01-30", + "last_updated": "2026-04-30", + "cost": { + "input": 0, + "output": 0 + }, + "type": "embedding" }, { - "id": "command-a-03-2025", - "name": "Command A", - "display_name": "Command A", + "id": "meta/llama-3.1-70b-instruct", + "name": "Llama 3.1 70b Instruct", + "display_name": "Llama 3.1 70b Instruct", "modalities": { "input": [ "text" @@ -99109,8 +106292,8 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -99119,28 +106302,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2024-07-16", + "last_updated": "2024-07-16", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "cloudferro-sherlock": { - "id": "cloudferro-sherlock", - "name": "CloudFerro Sherlock", - "display_name": "CloudFerro Sherlock", - "api": 
"https://api-sherlock.cloudferro.com/openai/v1/", - "doc": "https://docs.sherlock.cloudferro.com/", - "models": [ + }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "meta/esm2-650m", + "name": "esm2-650m", + "display_name": "esm2-650m", "modalities": { "input": [ "text" @@ -99150,66 +106323,61 @@ ] }, "limit": { - "context": 70000, - "output": 70000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10-09", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-08-29", + "last_updated": "2025-03-10", "cost": { - "input": 2.92, - "output": 2.92 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 2.92, - "output": 2.92 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "speakleash/Bielik-11B-v3.0-Instruct", - "name": "Bielik 11B v3.0 Instruct", - "display_name": "Bielik 11B v3.0 Instruct", + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1b 
Instruct", + "display_name": "Llama 3.2 1b Instruct", "modalities": { "input": [ "text" @@ -99219,8 +106387,8 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -99229,19 +106397,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", - "cost": { - "input": 0.67, - "output": 0.67 + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "cost": { + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "speakleash/Bielik-11B-v2.6-Instruct", - "name": "Bielik 11B v2.6 Instruct", - "display_name": "Bielik 11B v2.6 Instruct", + "id": "meta/esmfold", + "name": "esmfold", + "display_name": "esmfold", "modalities": { "input": [ "text" @@ -99251,130 +106419,94 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2024-03-15", + "last_updated": "2025-06-12", "cost": { - "input": 0.67, - "output": 0.67 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11b Vision Instruct", + "display_name": "Llama 3.2 11b Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196000, - "output": 16000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + 
"attachment": true, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "kuae-cloud-coding-plan": { - "id": "kuae-cloud-coding-plan", - "name": "KUAE Cloud Coding Plan", - "display_name": "KUAE Cloud Coding Plan", - "api": "https://coding-plan-endpoint.kuaecloud.net/v1", - "doc": "https://docs.mthreads.com/kuaecloud/kuaecloud-doc-online/coding_plan/", - "models": [ + }, { - "id": "GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "meta/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17b 128e Instruct", + "display_name": "Llama 4 Maverick 17b 128e Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-02", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" - } - ] - }, - "xai": { - "id": "xai", - "name": "xai", - "display_name": "xai", - "doc": "https://docs.x.ai/docs/models", - "models": [ + }, { - "id": "grok-2-1212", - "name": "Grok 2 1212", - "display_name": "Grok 2 1212", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + 
"display_name": "Llama 3.3 70b Instruct", "modalities": { "input": [ "text" @@ -99384,67 +106516,59 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-12-12", - "last_updated": "2024-12-12", + "open_weights": true, + "release_date": "2024-11-26", + "last_updated": "2024-11-26", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-vision-beta", - "name": "Grok Vision Beta", - "display_name": "Grok Vision Beta", + "id": "meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 32768, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 5, - "output": 15, - "cache_read": 5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "meta/llama-guard-4-12b", + "name": "Llama Guard 4 12B", + "display_name": "Llama Guard 4 12B", "modalities": { "input": [ "text", @@ -99455,40 +106579,28 @@ ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - 
"supported": true - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2026-04-30", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-3-mini-fast", - "name": "Grok 3 Mini Fast", - "display_name": "Grok 3 Mini Fast", + "id": "meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -99498,32 +106610,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-3-mini-latest", - "name": "Grok 3 Mini Latest", - "display_name": "Grok 3 Mini Latest", + "id": "stepfun-ai/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -99533,8 +106642,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -99543,22 +106652,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 0.3, 
- "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-3-fast", - "name": "Grok 3 Fast", - "display_name": "Grok 3 Fast", + "id": "deepseek-ai/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -99568,76 +106674,108 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.25 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "grok-2-vision-latest", - "name": "Grok 2 Vision Latest", - "display_name": "Grok 2 Vision Latest", + "id": "deepseek-ai/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + 
"attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "anthropic": { + "id": "anthropic", + "name": "Anthropic", + "display_name": "Anthropic", + "doc": "https://docs.anthropic.com/en/docs/about-claude/models", + "models": [ { - "id": "grok-4.20-0309-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -99647,138 +106785,147 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, 
"attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "grok-3-mini-fast-latest", - "name": "Grok 3 Mini Fast Latest", - "display_name": "Grok 3 Mini Fast Latest", + "id": "claude-3-haiku-20240307", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "claude-3-sonnet-20240229", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2023-08-31", + "release_date": 
"2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "grok-3-latest", - "name": "Grok 3 Latest", - "display_name": "Grok 3 Latest", + "id": "claude-3-5-haiku-latest", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -99786,66 +106933,72 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "grok-2", - "name": "Grok 2", - "display_name": "Grok 2", + "id": "claude-3-opus-20240229", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": 
"claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -99853,39 +107006,36 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "grok-4.20-0309-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "claude-3-5-sonnet-20240620", + "name": "Claude Sonnet 3.5", + "display_name": "Claude Sonnet 3.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -99894,72 +107044,74 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2024-04-30", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-3-fast-latest", - "name": "Grok 3 Fast Latest", - "display_name": "Grok 3 Fast Latest", + "id": "claude-opus-4-0", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", 
"modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.25 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-4.20-multi-agent-0309", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -99971,142 +107123,181 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + 
"context": 1000000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { "input": 3, "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-2-latest", - "name": "Grok 2 Latest", - "display_name": "Grok 2 Latest", + "id": "claude-sonnet-4-0", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 3, + "output": 15, + "cache_read": 
0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-beta", - "name": "Grok Beta", - "display_name": "Grok Beta", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 5, - "output": 15, - "cache_read": 5 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-2-vision", - "name": "Grok 2 Vision", - "display_name": "Grok 2 Vision", + "id": "claude-3-5-haiku-20241022", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -100115,66 +107306,70 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "grok-4-1-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude Sonnet 3.5 v2", + 
"display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -100182,276 +107377,366 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "grok-2-vision-1212", - "name": "Grok 2 Vision 1212", - "display_name": "Grok 2 Vision 1212", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, + "context": 200000, "output": 32000 }, 
"temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "search": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { "input": 3, "output": 15, - "cache_read": 0.75 + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "grok-3-mini-fast-beta", - "name": "Grok 3 Mini Fast Beta", - "display_name": "Grok 3 Mini Fast Beta", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "effort": "low" - }, - "search": { - "supported": false - }, - "attachment": false, - "type": "chat" - }, - { - "id": "grok-3-mini-beta", - "name": "Grok 3 Mini Beta", - "display_name": "Grok 3 Mini Beta", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 120000, - "output": 100000 + "default": false }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true, - "effort": "low" + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": 
false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, - "search": { - "supported": false + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, - "attachment": false, "type": "chat" }, { - "id": "grok-3-fast-beta", - "name": "Grok 3 Fast Beta", - "display_name": "Grok 3 Fast Beta", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "search": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, - "attachment": false, "type": "chat" }, { - "id": "grok-2-image-1212", - "name": "Grok 2 Image 1212", - "display_name": "Grok 2 Image 1212", + "id": 
"claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 130000, - "output": 100000 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "search": { - "supported": false + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, - "attachment": false, "type": "chat" }, { - "id": "grok-3-beta", - "name": "Grok 3 Beta", - "display_name": "Grok 3 Beta", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "search": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, - "attachment": false, "type": "chat" } ] }, - "meganova": { - "id": "meganova", - "name": "Meganova", - "display_name": "Meganova", - "api": "https://api.meganova.ai/v1", - "doc": "https://docs.meganova.ai", + "zhipuai-coding-plan": { + "id": "zhipuai-coding-plan", + "name": "Zhipu AI Coding Plan", + "display_name": "Zhipu AI Coding Plan", + "api": "https://open.bigmodel.cn/api/coding/paas/v4", + "doc": 
"https://docs.bigmodel.cn/cn/coding-plan/overview", "models": [ { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -100461,41 +107746,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 0.09, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen3.5-Plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", - "modalities": { - "input": [ - "text", - "image", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -100516,50 +107768,66 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02", - "last_updated": "2026-02", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.4, - "output": 2.4, - "reasoning": 2.4 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", + "id": "glm-4.7", "name": "GLM-4.7", "display_name": "GLM-4.7", "modalities": { @@ -100571,7 +107839,7 @@ ] }, "limit": { - "context": 202752, + "context": 204800, "output": 131072 }, "temperature": true, @@ -100597,15 +107865,17 @@ "release_date": "2025-12-22", "last_updated": "2025-12-22", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ "text" @@ -100615,7 +107885,7 @@ ] }, "limit": { - "context": 202752, + "context": 200000, "output": 131072 }, "temperature": true, @@ -100636,19 +107906,21 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.8, - "output": 2.56 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -100658,8 +107930,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -100667,36 +107939,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.45, - "output": 1.9 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "atomic-chat": { + "id": "atomic-chat", + "name": "Atomic Chat", + "display_name": "Atomic Chat", + "api": "http://127.0.0.1:1337/v1", + "doc": "https://atomic.chat", + "models": [ { - "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24B Instruct", - "display_name": "Mistral Small 3.2 24B Instruct", + "id": "gemma-4-E4B-it-IQ4_XS", + "name": "Gemma 4 E4B Instruct (IQ4_XS)", + "display_name": "Gemma 4 E4B Instruct (IQ4_XS)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -100707,15 +107978,14 @@ "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { "input": 0, "output": 0 @@ -100723,9 +107993,9 @@ "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "gemma-4-E4B-it-MLX-4bit", + "name": "Gemma 4 E4B Instruct (MLX 4-bit)", + "display_name": "Gemma 4 E4B Instruct (MLX 4-bit)", "modalities": { "input": [ "text" @@ -100735,61 +108005,60 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": 
false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.02, - "output": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "XiaomiMiMo/MiMo-V2-Flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", + "id": "Qwen3_5-9B-Q4_K_M", + "name": "Qwen 3.5 9B (Q4_K_M)", + "display_name": "Qwen 3.5 9B (Q4_K_M)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-03-05", + "last_updated": "2026-04-04", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "Meta-Llama-3_1-8B-Instruct-GGUF", + "name": "Meta Llama 3.1 8B Instruct (GGUF)", + "display_name": "Meta Llama 3.1 8B Instruct (GGUF)", "modalities": { "input": [ "text" @@ -100800,7 +108069,7 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -100809,49 +108078,59 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "Qwen3_5-9B-MLX-4bit", + "name": "Qwen 3.5 9B (MLX 4-bit)", + 
"display_name": "Qwen 3.5 9B (MLX 4-bit)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "release_date": "2026-03-05", + "last_updated": "2026-04-04", "cost": { - "input": 0.27, - "output": 1 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "github-models": { + "id": "github-models", + "name": "GitHub Models", + "display_name": "GitHub Models", + "api": "https://models.github.ai/inference", + "doc": "https://docs.github.com/en/github-models", + "models": [ { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "cohere/cohere-command-r-plus", + "name": "Cohere Command R+", + "display_name": "Cohere Command R+", "modalities": { "input": [ "text" @@ -100861,8 +108140,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -100870,19 +108149,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-04-04", + "last_updated": "2024-08-01", "cost": { - "input": 0.25, - "output": 0.88 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "cohere/cohere-command-r-plus-08-2024", + "name": "Cohere Command R+ 08-2024", + "display_name": "Cohere Command R+ 08-2024", "modalities": { "input": [ "text" @@ -100892,8 +108172,8 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 128000, + "output": 
4096 }, "temperature": true, "tool_call": true, @@ -100901,19 +108181,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-10", - "last_updated": "2025-10-10", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.27, - "output": 0.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "cohere/cohere-command-r", + "name": "Cohere Command R", + "display_name": "Cohere Command R", "modalities": { "input": [ "text" @@ -100923,41 +108204,30 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-03-11", + "last_updated": "2024-08-01", "cost": { - "input": 0.5, - "output": 2.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "cohere/cohere-command-r-08-2024", + "name": "Cohere Command R 08-2024", + "display_name": "Cohere Command R 08-2024", "modalities": { "input": [ "text" @@ -100967,33 +108237,29 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, 
"attachment": false, - "open_weights": true, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.26, - "output": 0.38 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "cohere/cohere-command-a", + "name": "Cohere Command A", + "display_name": "Cohere Command A", "modalities": { "input": [ "text" @@ -101003,8 +108269,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101012,77 +108278,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.6, - "output": 2.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - 
"open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.45, - "output": 2.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "openai/o1-preview", + "name": "OpenAI o1-preview", + "display_name": "OpenAI o1-preview", "modalities": { "input": [ "text" @@ -101092,11 +108336,11 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -101104,234 +108348,261 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { 
- "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.28, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "evroc": { - "id": "evroc", - "name": "evroc", - "display_name": "evroc", - "api": "https://models.think.evroc.com/v1", - "doc": "https://docs.evroc.com/products/think/overview.html", - "models": [ + }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen3 VL 30B", - "display_name": "Qwen3 VL 30B", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 100000 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.24, - "output": 0.94 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": 
false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "attachment": true, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.12, - "output": 0.12 + "input": 0, + "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", - "name": "Qwen3 30B 2507", - "display_name": "Qwen3 30B 2507", + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "OpenAI o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 200000, + "output": 100000 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { - "input": 0.35, - "output": 1.42 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/devstral-small-2-24b-instruct-2512", - "name": "Devstral Small 2 24B Instruct 2512", - "display_name": "Devstral Small 2 24B Instruct 2512", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": 
"2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.12, - "output": 0.47 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/Voxtral-Small-24B-2507", - "name": "Voxtral Small 24B", - "display_name": "Voxtral Small 24B", + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "OpenAI o4-mini", "modalities": { "input": [ - "audio", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 200000, + "output": 100000 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/Magistral-Small-2509", - "name": "Magistral Small 1.2 24B", - "display_name": "Magistral Small 1.2 24B", + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "OpenAI o3-mini", "modalities": { "input": [ "text" @@ -101341,27 +108612,44 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + 
"effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.59, - "output": 2.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "microsoft/Phi-4-multimodal-instruct", - "name": "Phi-4 15B", - "display_name": "Phi-4 15B", + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ "text", @@ -101372,58 +108660,44 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 200000, + "output": 100000 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.24, - "output": 0.47 - }, - "type": "chat" - }, - { - "id": "KBLab/kb-whisper-large", - "name": "KB Whisper", - "display_name": "KB Whisper", - "modalities": { - "input": [ - "audio" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 448, - "output": 448 + "supported": true, + "default": true }, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "nvidia/Llama-3.3-70B-Instruct-FP8", - "name": "Llama 3.3 70B", - "display_name": "Llama 
3.3 70B", + "id": "openai/o1-mini", + "name": "OpenAI o1-mini", + "display_name": "OpenAI o1-mini", "modalities": { "input": [ "text" @@ -101433,58 +108707,44 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 65536 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 1.18, - "output": 1.18 - }, - "type": "chat" - }, - { - "id": "openai/whisper-large-v3", - "name": "Whisper 3 Large", - "display_name": "Whisper 3 Large", - "modalities": { - "input": [ - "audio" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 448, - "output": 4096 + "supported": true, + "default": true }, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "ai21-labs/ai21-jamba-1.5-mini", + "name": "AI21 Jamba 1.5 Mini", + "display_name": "AI21 Jamba 1.5 Mini", "modalities": { "input": [ "text" @@ -101494,77 +108754,63 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 256000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - 
"open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { - "input": 0.24, - "output": 0.94 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "ai21-labs/ai21-jamba-1.5-large", + "name": "AI21 Jamba 1.5 Large", + "display_name": "AI21 Jamba 1.5 Large", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { - "input": 1.47, - "output": 5.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "intfloat/multilingual-e5-large-instruct", - "name": "E5 Multi-Lingual Large Embeddings 0.6B", - "display_name": "E5 Multi-Lingual Large Embeddings 0.6B", + "id": "core42/jais-30b-chat", + "name": "JAIS 30b Chat", + "display_name": "JAIS 30b Chat", "modalities": { "input": [ "text" @@ -101574,36 +108820,30 @@ ] }, "limit": { - "context": 512, - "output": 512 + "context": 8192, + "output": 2048 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "knowledge": "2023-03", + "release_date": 
"2023-08-30", + "last_updated": "2023-08-30", "cost": { - "input": 0.12, - "output": 0.12 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "synthetic": { - "id": "synthetic", - "name": "Synthetic", - "display_name": "Synthetic", - "api": "https://api.synthetic.new/openai/v1", - "doc": "https://synthetic.new/pricing", - "models": [ + }, { - "id": "hf:meta-llama/Llama-3.1-405B-Instruct", - "name": "Llama-3.1-405B-Instruct", - "display_name": "Llama-3.1-405B-Instruct", + "id": "microsoft/phi-3-medium-128k-instruct", + "name": "Phi-3-medium instruct (128k)", + "display_name": "Phi-3-medium instruct (128k)", "modalities": { "input": [ "text" @@ -101614,7 +108854,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101624,52 +108864,52 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 3, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama-4-Scout-17B-16E-Instruct", - "display_name": "Llama-4-Scout-17B-16E-Instruct", + "id": "microsoft/phi-3-medium-4k-instruct", + "name": "Phi-3-medium instruct (4k)", + "display_name": "Phi-3-medium instruct (4k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 328000, - "output": 4096 + "context": 4096, + "output": 1024 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.15, - "output": 
0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "microsoft/phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -101679,8 +108919,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101690,19 +108930,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.9, - "output": 0.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "microsoft/phi-3-mini-128k-instruct", + "name": "Phi-3-mini instruct (128k)", + "display_name": "Phi-3-mini instruct (128k)", "modalities": { "input": [ "text" @@ -101713,7 +108953,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101723,19 +108963,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama-3.1-70B-Instruct", - "display_name": "Llama-3.1-70B-Instruct", + "id": "microsoft/phi-4-reasoning", + "name": "Phi-4-Reasoning", + "display_name": "Phi-4-Reasoning", "modalities": { "input": [ "text" @@ -101746,7 +108986,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101756,63 
+108996,64 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.9, - "output": 0.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "microsoft/phi-3-small-128k-instruct", + "name": "Phi-3-small instruct (128k)", + "display_name": "Phi-3-small instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 524000, + "context": 128000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "microsoft/phi-3.5-vision-instruct", + "name": "Phi-3.5-vision instruct (128k)", + "display_name": "Phi-3.5-vision instruct (128k)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101820,25 +109061,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2023-10", + "release_date": 
"2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "microsoft/phi-3-small-8k-instruct", + "name": "Phi-3-small instruct (8k)", + "display_name": "Phi-3-small instruct (8k)", "modalities": { "input": [ "text" @@ -101848,8 +109085,8 @@ ] }, "limit": { - "context": 191488, - "output": 65536 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -101857,32 +109094,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-07", - "last_updated": "2026-02-07", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "microsoft/phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE instruct (128k)", + "display_name": "Phi-3.5-MoE instruct (128k)", "modalities": { "input": [ "text" @@ -101892,8 +109118,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101901,43 +109127,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": 
"2024-08-20", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-97B-A17B", - "display_name": "Qwen3.5-97B-A17B", + "id": "microsoft/phi-3.5-mini-instruct", + "name": "Phi-3.5-mini instruct (128k)", + "display_name": "Phi-3.5-mini instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101945,32 +109160,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen2.5-Coder-32B-Instruct", + "id": "microsoft/mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ "text" @@ -101980,29 +109184,30 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 65536, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-11-11", - "last_updated": "2024-11-11", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.8, - "output": 0.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": 
"hf:Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen 3 235B Instruct", - "display_name": "Qwen 3 235B Instruct", + "id": "microsoft/phi-3-mini-4k-instruct", + "name": "Phi-3-mini instruct (4k)", + "display_name": "Phi-3-mini instruct (4k)", "modalities": { "input": [ "text" @@ -102012,29 +109217,30 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 4096, + "output": 1024 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -102044,8 +109250,8 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -102053,32 +109259,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.65, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": 
"microsoft/phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -102088,32 +109283,35 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 2, - "output": 2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "microsoft/phi-4-multimodal-instruct", + "name": "Phi-4-multimodal-instruct", + "display_name": "Phi-4-multimodal-instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -102121,7 +109319,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -102130,19 +109328,20 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 (0324)", - "display_name": "DeepSeek V3 (0324)", + "id": "mistral-ai/mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ "text" @@ -102153,27 +109352,29 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + 
"default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 1.2, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "mistral-ai/codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ "text" @@ -102183,8 +109384,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102193,20 +109394,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 1.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "mistral-ai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -102217,7 +109418,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102225,35 +109426,25 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2024-03", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + 
"output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 (0528)", - "display_name": "DeepSeek R1 (0528)", + "id": "mistral-ai/mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -102261,7 +109452,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -102269,42 +109460,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 3, - "output": 8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "mistral-ai/mistral-medium-2505", + "name": "Mistral Medium 3 (25.05)", + "display_name": "Mistral Medium 3 (25.05)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 162816, - "output": 8000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -102312,27 +109494,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.27, - "cache_write": 0 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": 
"hf:deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "mistral-ai/ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -102343,7 +109519,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102352,19 +109528,20 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-25", + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1.2, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -102374,8 +109551,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102385,23 +109562,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -102411,8 +109595,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 
65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102433,19 +109617,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "knowledge": "2024-06", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -102455,41 +109639,41 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-06", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 1.2, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102497,32 +109681,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + 
"open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-NVFP4", - "name": "Nemotron 3 Super 120B", - "display_name": "Nemotron 3 Super 120B", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -102532,8 +109705,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102541,45 +109714,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-03-11", - "last_updated": "2026-04-03", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 0.3, - "output": 1, - "cache_read": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:nvidia/Kimi-K2.5-NVFP4", - "name": "Kimi K2.5 (NVFP4)", - "display_name": "Kimi K2.5 (NVFP4)", + "id": "meta/meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -102587,32 +109747,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": 
"2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:zai-org/GLM-4.7-Flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "meta/meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -102622,8 +109771,8 @@ ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -102631,43 +109780,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-01-18", - "last_updated": "2026-01-18", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.06, - "output": 0.4, - "cache_read": 0.06 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:zai-org/GLM-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102675,43 +109814,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, 
"open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:zai-org/GLM-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102719,32 +109848,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-12", + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 1, - "output": 3, - "cache_read": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "meta/meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -102754,8 +109872,8 @@ ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -102763,43 +109881,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - 
"release_date": "2026-02-12", - "last_updated": "2026-04-08", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 1, - "output": 3, - "cache_read": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102807,38 +109916,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "meta/meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -102846,45 +109949,26 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + 
"knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.95 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "nvidia": { - "id": "nvidia", - "name": "Nvidia", - "display_name": "Nvidia", - "api": "https://integrate.api.nvidia.com/v1", - "doc": "https://docs.api.nvidia.com/nim/", - "models": [ + }, { - "id": "upstage/solar-10_7b-instruct", - "name": "solar-10.7b-instruct", - "display_name": "solar-10.7b-instruct", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -102897,12 +109981,14 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-06-05", - "last_updated": "2025-04-10", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { "input": 0, "output": 0 @@ -102910,32 +109996,32 @@ "type": "chat" }, { - "id": "black-forest-labs/flux_2-klein-4b", - "name": "FLUX.2 Klein 4B", - "display_name": "FLUX.2 Klein 4B", + "id": "meta/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-01-14", - "last_updated": "2026-01-31", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { "input": 0, "output": 0 @@ 
-102943,108 +110029,121 @@ "type": "chat" }, { - "id": "black-forest-labs/flux.1-dev", - "name": "FLUX.1-dev", - "display_name": "FLUX.1-dev", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 4096, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-01", - "last_updated": "2025-09-05", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { "input": 0, "output": 0 }, "type": "chat" - }, + } + ] + }, + "qiniu-ai": { + "id": "qiniu-ai", + "name": "Qiniu", + "display_name": "Qiniu", + "api": "https://api.qnaigc.com/v1", + "doc": "https://developer.qiniu.com/aitokenapi", + "models": [ { - "id": "black-forest-labs/flux_1-schnell", - "name": "FLUX.1-schnell", - "display_name": "FLUX.1-schnell", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30b A3b Instruct 2507", + "display_name": "Qwen3 30b A3b Instruct 2507", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 77, - "output": 8192 + "context": 128000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-08-01", + "open_weights": false, + "release_date": "2026-02-04", "last_updated": "2026-02-04", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "black-forest-labs/flux_1-kontext-dev", - "name": "FLUX.1-Kontext-dev", - "display_name": "FLUX.1-Kontext-dev", + "id": 
"qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 256000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-06", + "last_updated": "2025-09-06", "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "doubao-seed-2.0-pro", + "name": "Doubao Seed 2.0 Pro", + "display_name": "Doubao Seed 2.0 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -103052,7 +110151,7 @@ }, "limit": { "context": 256000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -103060,20 +110159,16 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "mistralai/mistral-large-3-675b-instruct-2512", - "name": "Mistral Large 3 675B Instruct 2512", - "display_name": "Mistral Large 3 675B Instruct 2512", + "id": "claude-3.7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", "modalities": { "input": [ "text", @@ -103084,40 +110179,58 
@@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/devstral-2-123b-instruct-2512", - "name": "Devstral-2-123B-Instruct-2512", - "display_name": "Devstral-2-123B-Instruct-2512", + "id": "doubao-seed-2.0-code", + "name": "Doubao Seed 2.0 Code", + "display_name": "Doubao Seed 2.0 Code", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -103126,23 +110239,21 @@ "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-08", - "last_updated": "2025-12-09", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "mistralai/mistral-nemotron", - "name": "mistral-nemotron", - "display_name": "mistral-nemotron", + "id": "qwen2.5-vl-72b-instruct", + "name": "Qwen 2.5 VL 72B Instruct", + "display_name": "Qwen 2.5 VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], 
"output": [ "text" @@ -103157,20 +110268,16 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-12", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mixtral-8x22b-instruct", - "name": "Mistral: Mixtral 8x22B Instruct", - "display_name": "Mistral: Mixtral 8x22B Instruct", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -103180,59 +110287,86 @@ ] }, "limit": { - "context": 65536, - "output": 13108 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2024-04-17", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mistral-medium-3-instruct", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + 
"budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mixtral-8x7b-instruct", - "name": "Mistral: Mixtral 8x7B Instruct", - "display_name": "Mistral: Mixtral 8x7B Instruct", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -103242,28 +110376,36 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-12-10", - "last_updated": "2026-03-15", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/magistral-small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -103273,133 +110415,125 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", 
- "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct-v03", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "doubao-seed-2.0-mini", + "name": "Doubao Seed 2.0 Mini", + "display_name": "Doubao Seed 2.0 Mini", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "mistralai/mistral-small-4-119b-2603", - "name": "mistral-small-4-119b-2603", - "display_name": "mistral-small-4-119b-2603", + "id": "claude-3.5-sonnet", + "name": "Claude 3.5 Sonnet", + "display_name": "Claude 3.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 8200 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-09", + "last_updated": "2025-09-09", "type": "chat" }, { - "id": "sarvamai/sarvam-m", - "name": "sarvam-m", - "display_name": "sarvam-m", + "id": "claude-4.0-sonnet", + "name": "Claude 4.0 Sonnet", + "display_name": "Claude 4.0 Sonnet", "modalities": { "input": [ - "text" + "text", + 
"image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-Mini", - "display_name": "Phi-4-Mini", + "id": "doubao-seed-1.6-thinking", + "name": "Doubao-Seed 1.6 Thinking", + "display_name": "Doubao-Seed 1.6 Thinking", "modalities": { "input": [ - "text", "image", - "audio" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -103409,19 +110543,14 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Phi 4 Multimodal", - "display_name": "Phi 4 Multimodal", + "id": "deepseek-v3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ "text" @@ -103432,61 +110561,61 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 16000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning", - "name": "Nemotron 
3 Nano Omni", - "display_name": "Nemotron 3 Nano Omni", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-28", - "last_updated": "2026-04-28", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "type": "chat" }, { - "id": "nvidia/usdvalidate", - "name": "usdvalidate", - "display_name": "usdvalidate", + "id": "glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -103496,59 +110625,103 @@ ] }, "limit": { - "context": 8192, + "context": 131000, "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2025-01-08", - "cost": { - "input": 0, - "output": 0 + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "type": "chat" + }, + { + "id": "qwen3-235b-a22b", + "name": "Qwen 3 235B A22B", + "display_name": "Qwen 3 235B A22B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + 
"supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/synthetic-video-detector", - "name": "synthetic-video-detector", - "display_name": "synthetic-video-detector", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ - "video" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 256000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-22", + "last_updated": "2026-02-22", "type": "chat" }, { - "id": "nvidia/cosmos-transfer1-7b", - "name": "cosmos-transfer1-7b", - "display_name": "cosmos-transfer1-7b", + "id": "doubao-1.5-vision-pro", + "name": "Doubao 1.5 Vision Pro", + "display_name": "Doubao 1.5 Vision Pro", "modalities": { "input": [ "text", @@ -103556,63 +110729,57 @@ "video" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 16000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-13", - "last_updated": "2025-06-30", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + 
"release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/rerank-qa-mistral-4b", - "name": "rerank-qa-mistral-4b", - "display_name": "rerank-qa-mistral-4b", + "id": "claude-4.5-haiku", + "name": "Claude 4.5 Haiku", + "display_name": "Claude 4.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-17", - "last_updated": "2025-01-17", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "type": "chat" }, { - "id": "nvidia/nv-embedcode-7b-v1", - "name": "nv-embedcode-7b-v1", - "display_name": "nv-embedcode-7b-v1", + "id": "qwen-max-2025-01-25", + "name": "Qwen2.5-Max-2025-01-25", + "display_name": "Qwen2.5-Max-2025-01-25", "modalities": { "input": [ "text" @@ -103622,28 +110789,24 @@ ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-17", - "last_updated": "2025-05-29", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super", - "display_name": "Nemotron 3 Super", + "id": "doubao-1.5-thinking-pro", + "name": "Doubao 1.5 Thinking Pro", + "display_name": "Doubao 1.5 Thinking Pro", "modalities": { "input": [ "text" @@ -103653,8 +110816,8 @@ ] }, "limit": { - 
"context": 262144, - "output": 262144 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -103663,20 +110826,15 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", - "cost": { - "input": 0.2, - "output": 0.8 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/riva-translate-4b-instruct-v1_1", - "name": "riva-translate-4b-instruct-v1_1", - "display_name": "riva-translate-4b-instruct-v1_1", + "id": "glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -103686,32 +110844,31 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 98304 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/nemotron-voicechat", - "name": "nemotron-voicechat", - "display_name": "nemotron-voicechat", + "id": "qwen2.5-vl-7b-instruct", + "name": "Qwen 2.5 VL 7B Instruct", + "display_name": "Qwen 2.5 VL 7B Instruct", "modalities": { "input": [ "text", - "audio" + "image", + "audio", + "video" ], "output": [ "text" @@ -103727,19 +110884,15 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/llama-3_3-nemotron-super-49b-v1_5", - "name": "Llama 3.3 Nemotron Super 49B 
v1.5", - "display_name": "Llama 3.3 Nemotron Super 49B v1.5", + "id": "qwen-turbo", + "name": "Qwen-Turbo", + "display_name": "Qwen-Turbo", "modalities": { "input": [ "text" @@ -103749,8 +110902,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -103758,21 +110911,27 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/usdcode", - "name": "usdcode", - "display_name": "usdcode", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -103786,183 +110945,196 @@ "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "nvidia/llama-3_2-nemoretriever-300m-embed-v1", - "name": "llama-3_2-nemoretriever-300m-embed-v1", - "display_name": "llama-3_2-nemoretriever-300m-embed-v1", + "id": "claude-4.0-opus", + "name": "Claude 4.0 Opus", + "display_name": "Claude 4.0 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 200000, 
+ "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-24", - "last_updated": "2025-07-24", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/llama-3_1-nemotron-safety-guard-8b-v3", - "name": "llama-3.1-nemotron-safety-guard-8b-v3", - "display_name": "llama-3.1-nemotron-safety-guard-8b-v3", + "id": "claude-4.5-sonnet", + "name": "Claude 4.5 Sonnet", + "display_name": "Claude 4.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "type": "chat" }, { - "id": "nvidia/nv-embed-v1", - "name": "nv-embed-v1", - "display_name": "nv-embed-v1", + "id": "claude-4.5-opus", + "name": "Claude 4.5 Opus", + "display_name": "Claude 4.5 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 200000, + "output": 200000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-07", - "last_updated": "2025-07-22", - "cost": { - "input": 0, - 
"output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "nemotron-3-nano-30b-a3b", - "display_name": "nemotron-3-nano-30b-a3b", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-12", - "last_updated": "2024-12", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/gliner-pii", - "name": "gliner-pii", - "display_name": "gliner-pii", + "id": "claude-4.1-opus", + "name": "Claude 4.1 Opus", + "display_name": "Claude 4.1 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + 
"attachment": true, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "nvidia/bevformer", - "name": "bevformer", - "display_name": "bevformer", + "id": "doubao-seed-1.6", + "name": "Doubao-Seed 1.6", + "display_name": "Doubao-Seed 1.6", "modalities": { "input": [ + "text", + "image", "video" ], "output": [ @@ -103970,28 +111142,25 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": "2025-07-20", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" }, { - "id": "nvidia/nemotron-mini-4b-instruct", - "name": "nemotron-mini-4b-instruct", - "display_name": "nemotron-mini-4b-instruct", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30b A3b Thinking 2507", + "display_name": "Qwen3 30b A3b Thinking 2507", "modalities": { "input": [ "text" @@ -104001,61 +111170,75 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 126000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-21", - "last_updated": "2024-08-26", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-04", + "last_updated": "2026-02-04", "type": "chat" }, { - "id": "nvidia/cosmos-predict1-5b", - "name": "cosmos-predict1-5b", - "display_name": 
"cosmos-predict1-5b", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 40000, "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": "2025-03-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/llama-3_3-nemotron-super-49b-v1", - "name": "Llama 3.3 Nemotron Super 49B v1", - "display_name": "Llama 3.3 Nemotron Super 49B v1", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -104066,7 +111249,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -104074,32 +111257,41 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-07", - "last_updated": "2025-04-07", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "type": "chat" }, { - "id": "nvidia/nvidia-nemotron-nano-9b-v2", - "name": 
"nvidia-nemotron-nano-9b-v2", - "display_name": "nvidia-nemotron-nano-9b-v2", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -104107,152 +111299,158 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2025-08-18", - "last_updated": "2025-08-18", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/cosmos-transfer2_5-2b", - "name": "cosmos-transfer2.5-2b", - "display_name": "cosmos-transfer2.5-2b", + "id": "qwen-vl-max-2025-01-25", + "name": "Qwen VL-MAX-2025-01-25", + "display_name": "Qwen VL-MAX-2025-01-25", "modalities": { "input": [ "text", "image", + "audio", "video" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/nemotron-content-safety-reasoning-4b", - "name": "nemotron-content-safety-reasoning-4b", - "display_name": "nemotron-content-safety-reasoning-4b", + "id": "doubao-seed-2.0-lite", + "name": "Doubao Seed 2.0 Lite", + "display_name": "Doubao Seed 2.0 Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - 
"output": 4096 + "context": 256000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-22", - "last_updated": "2026-01-22", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "nvidia/active-speaker-detection", - "name": "Active Speaker Detection", - "display_name": "Active Speaker Detection", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, + "context": 40000, "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/magpie-tts-zeroshot", - "name": "magpie-tts-zeroshot", - "display_name": "magpie-tts-zeroshot", + "id": "qwen3-vl-30b-a3b-thinking", + "name": "Qwen3-Vl 30b A3b Thinking", + "display_name": "Qwen3-Vl 30b A3b Thinking", "modalities": { "input": [ "text", - "audio" + "image", + "video" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, 
"reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-05-22", - "last_updated": "2025-06-12", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-09", + "last_updated": "2026-02-09", "type": "chat" }, { - "id": "nvidia/streampetr", - "name": "streampetr", - "display_name": "streampetr", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ - "video" + "text" ], "output": [ "text" @@ -104260,121 +111458,127 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "type": "chat" }, { - "id": "nvidia/sparsedrive", - "name": "sparsedrive", - "display_name": "sparsedrive", + "id": "gemini-3.0-pro-image-preview", + "name": "Gemini 3.0 Pro Image Preview", + "display_name": "Gemini 3.0 Pro Image Preview", "modalities": { "input": [ - "video" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, + "context": 32768, "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": "2025-07-20", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + 
"reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "type": "chat" }, { - "id": "nvidia/nemotron-3-content-safety", - "name": "nemotron-3-content-safety", - "display_name": "nemotron-3-content-safety", + "id": "kling-v2-6", + "name": "Kling-V2 6", + "display_name": "Kling-V2 6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 99999999, + "output": 99999999 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-13", + "last_updated": "2026-01-13", "type": "chat" }, { - "id": "nvidia/llama-nemotron-embed-vl-1b-v2", - "name": "llama-nemotron-embed-vl-1b-v2", - "display_name": "llama-nemotron-embed-vl-1b-v2", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235b A22B Instruct 2507", + "display_name": "Qwen3 235b A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 262144, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-10", - "last_updated": "2026-02-10", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-12", + 
"last_updated": "2025-08-12", "type": "chat" }, { - "id": "nvidia/studiovoice", - "name": "studiovoice", - "display_name": "studiovoice", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -104384,60 +111588,73 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-10-03", - "last_updated": "2025-06-13", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-14", + "last_updated": "2025-08-14", "type": "chat" }, { - "id": "nvidia/llama-nemotron-rerank-vl-1b-v2", - "name": "llama-nemotron-rerank-vl-1b-v2", - "display_name": "llama-nemotron-rerank-vl-1b-v2", + "id": "gemini-3.0-pro-preview", + "name": "Gemini 3.0 Pro Preview", + "display_name": "Gemini 3.0 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-31", - "last_updated": "2026-03-31", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": 
"deepseek-ai/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -104447,8 +111664,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 262144, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -104458,24 +111675,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -104486,61 +111704,53 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "openai/whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "doubao-seed-1.6-flash", + "name": "Doubao-Seed 1.6 Flash", + "display_name": "Doubao-Seed 1.6 Flash", "modalities": { "input": [ - "audio" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 
256000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "MiniMax-M1", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ "text" @@ -104550,8 +111760,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 80000 }, "temperature": true, "tool_call": true, @@ -104559,63 +111769,95 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, + "open_weights": false, "release_date": "2025-08-05", "last_updated": "2025-08-05", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + 
"continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-04", - "last_updated": "2025-08-14", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "minimaxai/minimax-m2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "display_name": "Gemini 2.5 Flash Image", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 32768, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", + "type": "imageGeneration" + }, + { + "id": "doubao-1.5-pro-32k", + "name": "Doubao 1.5 Pro 32k", + "display_name": "Doubao 1.5 Pro 32k", "modalities": { "input": [ "text" @@ -104625,40 +111867,24 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 12000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-04-11", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "minimaxai/minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ 
-104668,79 +111894,52 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "type": "chat" }, { - "id": "z-ai/glm4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "claude-3.5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0, - "output": 0 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "type": "chat" }, { - "id": "z-ai/glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -104750,8 +111949,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -104761,188 +111960,205 @@ }, "extra_capabilities": { "reasoning": { - 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "meta/esm2-650m", - "name": "esm2-650m", - "display_name": "esm2-650m", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1048576, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-29", - "last_updated": "2025-03-10", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama 3.3 70b Instruct", - "display_name": "Llama 3.3 70b Instruct", + "id": "gemini-3.0-flash-preview", + "name": "Gemini 3.0 Flash Preview", + "display_name": "Gemini 3.0 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-26", - "last_updated": "2024-11-26", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": 
"high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "type": "chat" }, { - "id": "meta/esmfold", - "name": "esmfold", - "display_name": "esmfold", + "id": "moonshotai/kimi-k2.5", + "name": "Moonshotai/Kimi-K2.5", + "display_name": "Moonshotai/Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-15", - "last_updated": "2025-06-12", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "type": "chat" }, { - "id": "meta/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + 
"release_date": "2025-09-08", + "last_updated": "2025-09-08", "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11b Vision Instruct", - "display_name": "Llama 3.2 11b Vision Instruct", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "type": "chat" }, { - "id": "meta/llama-guard-4-12b", - "name": "Llama Guard 4 12B", - "display_name": "Llama Guard 4 12B", + "id": "z-ai/autoglm-phone-9b", + "name": "Z-Ai/Autoglm Phone 9b", + "display_name": "Z-Ai/Autoglm Phone 9b", "modalities": { "input": [ "text", @@ -104953,28 +112169,24 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 12800, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2026-04-30", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "meta/llama-3.1-70b-instruct", - "name": "Llama 3.1 70b Instruct", - "display_name": "Llama 3.1 70b Instruct", + "id": "z-ai/glm-4.6", + "name": "Z-AI/GLM 
4.6", + "display_name": "Z-AI/GLM 4.6", "modalities": { "input": [ "text" @@ -104984,28 +112196,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "type": "chat" }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1b Instruct", - "display_name": "Llama 3.2 1b Instruct", + "id": "z-ai/glm-4.7", + "name": "Z-Ai/GLM 4.7", + "display_name": "Z-Ai/GLM 4.7", "modalities": { "input": [ "text" @@ -105015,93 +112228,126 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "meta/llama-4-maverick-17b-128e-instruct", - "name": "Llama 4 Maverick 17b 128e Instruct", - "display_name": "Llama 4 Maverick 17b 128e Instruct", + "id": "z-ai/glm-5", + "name": "Z-Ai/GLM 5", + "display_name": "Z-Ai/GLM 5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + 
"context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-02", - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "meta/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "openai/gpt-5.2", + "name": "OpenAI/GPT-5.2", + "display_name": "OpenAI/GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32000 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "type": "chat" }, { - "id": "meta/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "openai/gpt-5", + "name": "OpenAI/GPT-5", + "display_name": "OpenAI/GPT-5", "modalities": 
{ "input": [ "text" @@ -105111,75 +112357,90 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "type": "chat" }, { - "id": "qwen/qwen-image-edit", - "name": "Qwen Image Edit", - "display_name": "Qwen Image Edit", + "id": "minimax/minimax-m2.1", + "name": "Minimax/Minimax-M2.1", + "display_name": "Minimax/Minimax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - "type": "imageGeneration" + "attachment": false, + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "type": "chat" }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5 122B-A10B", - "display_name": "Qwen3.5 122B-A10B", + "id": "minimax/minimax-m2", + "name": "Minimax/Minimax-M2", + "display_name": 
"Minimax/Minimax-M2", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -105189,29 +112450,19 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "type": "chat" }, { - "id": "qwen/qwen2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32b Instruct", - "display_name": "Qwen2.5 Coder 32b Instruct", + "id": "minimax/minimax-m2.5", + "name": "Minimax/Minimax-M2.5", + "display_name": "Minimax/Minimax-M2.5", "modalities": { "input": [ "text" @@ -105221,40 +112472,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-06", - "last_updated": "2024-11-06", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "minimax/minimax-m2.5-highspeed", + "name": "Minimax/Minimax-M2.5 Highspeed", + "display_name": "Minimax/Minimax-M2.5 Highspeed", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
262144, - "output": 8192 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -105264,30 +112516,19 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "x-ai/grok-code-fast-1", + "name": "x-AI/Grok-Code-Fast 1", + "display_name": "x-AI/Grok-Code-Fast 1", "modalities": { "input": [ "text" @@ -105297,8 +112538,8 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, @@ -105308,126 +112549,112 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-02", + "last_updated": "2025-09-02", "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen3-Next-80B-A3B-Instruct", + "id": "x-ai/grok-4.1-fast-reasoning", + "name": "X-Ai/Grok 4.1 Fast Reasoning", + "display_name": "X-Ai/Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - 
"context": 262144, - "output": 16384 + "context": 20000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "type": "chat" }, { - "id": "qwen/qwen-image", - "name": "Qwen Image", - "display_name": "Qwen Image", + "id": "x-ai/grok-4.1-fast-non-reasoning", + "name": "X-Ai/Grok 4.1 Fast Non Reasoning", + "display_name": "X-Ai/Grok 4.1 Fast Non Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0, - "output": 0 - }, - "type": "imageGeneration" + "release_date": "2025-12-19", + "last_updated": "2025-12-19", + "type": "chat" }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "x-ai/grok-4-fast", + "name": "x-AI/Grok-4-Fast", + "display_name": "x-AI/Grok-4-Fast", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": 
"2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-09-20", + "last_updated": "2025-09-20", "type": "chat" }, { - "id": "google/gemma-2-2b-it", - "name": "Gemma 2 2b It", - "display_name": "Gemma 2 2b It", + "id": "x-ai/grok-4.1-fast", + "name": "x-AI/Grok-4.1-Fast", + "display_name": "x-AI/Grok-4.1-Fast", "modalities": { "input": [ "text" @@ -105437,65 +112664,61 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "type": "chat" }, { - "id": "google/gemma-3n-e4b-it", - "name": "Gemma 3n E4b It", - "display_name": "Gemma 3n E4b It", + "id": "x-ai/grok-4-fast-non-reasoning", + "name": "X-Ai/Grok-4-Fast-Non-Reasoning", + "display_name": "X-Ai/Grok-4-Fast-Non-Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-06-03", - "last_updated": "2025-06-03", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma-4-31B-IT", - "display_name": "Gemma-4-31B-IT", + "id": "x-ai/grok-4-fast-reasoning", + "name": "X-Ai/Grok-4-Fast-Reasoning", + "display_name": "X-Ai/Grok-4-Fast-Reasoning", "modalities": { 
"input": [ "text", "image", + "audio", "video" ], "output": [ @@ -105503,8 +112726,8 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -105512,25 +112735,24 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "type": "chat" }, { - "id": "google/gemma-3n-e2b-it", - "name": "Gemma 3n E2b It", - "display_name": "Gemma 3n E2b It", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek/DeepSeek-V3.2-Exp", + "display_name": "DeepSeek/DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -105538,94 +112760,79 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-06-12", - "last_updated": "2025-06-12", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma-3-27B-IT", - "display_name": "Gemma-3-27B-IT", + "id": "deepseek/deepseek-v3.1-terminus-thinking", + "name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", + "display_name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": 
true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "type": "chat" }, { - "id": "google/google-paligemma", - "name": "paligemma", - "display_name": "paligemma", + "id": "deepseek/deepseek-math-v2", + "name": "Deepseek/Deepseek-Math-V2", + "display_name": "Deepseek/Deepseek-Math-V2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 160000, + "output": 160000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2024-05-14", - "last_updated": "2024-08-26", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "deepseek/deepseek-v3.2-251201", + "name": "Deepseek/DeepSeek-V3.2", + "display_name": "Deepseek/DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -105636,7 +112843,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -105646,65 +112853,42 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-01-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "deepseek/deepseek-v3.2-exp-thinking", + "name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", + "display_name": 
"DeepSeek/DeepSeek-V3.2-Exp-Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek/DeepSeek-V3.1-Terminus", + "display_name": "DeepSeek/DeepSeek-V3.1-Terminus", "modalities": { "input": [ "text" @@ -105714,8 +112898,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -105723,66 +112907,43 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "stepfun/step-3.5-flash", + "name": "Stepfun/Step-3.5 Flash", + "display_name": "Stepfun/Step-3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 
64000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11", - "last_updated": "2025-12", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "type": "chat" }, { - "id": "abacusai/dracarys-llama-3_1-70b-instruct", - "name": "dracarys-llama-3.1-70b-instruct", - "display_name": "dracarys-llama-3.1-70b-instruct", + "id": "meituan/longcat-flash-chat", + "name": "Meituan/Longcat-Flash-Chat", + "display_name": "Meituan/Longcat-Flash-Chat", "modalities": { "input": [ "text" @@ -105792,28 +112953,24 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-11", - "last_updated": "2025-05-22", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-11-05", + "last_updated": "2025-11-05", "type": "chat" }, { - "id": "baai/bge-m3", - "name": "BGE M3", - "display_name": "BGE M3", + "id": "meituan/longcat-flash-lite", + "name": "Meituan/Longcat-Flash-Lite", + "display_name": "Meituan/Longcat-Flash-Lite", "modalities": { "input": [ "text" @@ -105823,64 +112980,52 @@ ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 256000, + "output": 320000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": 
false, - "open_weights": true, - "release_date": "2024-01-30", - "last_updated": "2026-04-30", - "cost": { - "input": 0, - "output": 0 - }, - "type": "embedding" + "open_weights": false, + "release_date": "2026-02-06", + "last_updated": "2026-02-06", + "type": "chat" }, { - "id": "bytedance/seed-oss-36b-instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "stepfun-ai/gelab-zero-4b-preview", + "name": "Stepfun-Ai/Gelab Zero 4b Preview", + "display_name": "Stepfun-Ai/Gelab Zero 4b Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "deepseek-ai/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "mimo-v2-flash", + "name": "Mimo-V2-Flash", + "display_name": "Mimo-V2-Flash", "modalities": { "input": [ "text" @@ -105890,8 +113035,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -105899,33 +113044,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2024-12-01", + 
"release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "xiaomi/mimo-v2-flash", + "name": "Xiaomi/Mimo-V2-Flash", + "display_name": "Xiaomi/Mimo-V2-Flash", "modalities": { "input": [ "text" @@ -105935,8 +113069,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -105944,74 +113078,69 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" } ] }, - "inference": { - "id": "inference", - "name": "Inference", - "display_name": "Inference", - "api": "https://inference.net/v1", - "doc": "https://inference.net/models", + "google": { + "id": "google", + "name": "google", + "display_name": "google", + "doc": "https://ai.google.dev/gemini-api/docs/models", "models": [ { - "id": "mistral/mistral-nemo-12b-instruct", - "name": "Mistral Nemo 12B Instruct", - "display_name": "Mistral Nemo 12B Instruct", + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1048576, + "output": 
65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.038, - "output": 0.1 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 }, "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11B Vision Instruct", - "display_name": "Llama 3.2 11B Vision Instruct", + "id": "gemma-4-26b-a4b-it", + "name": "Gemma 4 26B", + "display_name": "Gemma 4 26B", "modalities": { "input": [ "text", @@ -106022,125 +113151,170 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.055, - "output": 0.055 - }, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "type": "chat" }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "gemini-1.5-flash", + "name": "Gemini 1.5 Flash", + "display_name": "Gemini 1.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1000000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + 
"open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.075, + "output": 0.3, + "cache_read": 0.01875 }, "type": "chat" }, { - "id": "meta/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "meta/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09 2025", + "display_name": "Gemini 2.5 Flash Preview 09 2025", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + 
"budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "search": { + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.025, - "output": 0.025 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-7b-vision-instruct", - "name": "Qwen 2.5 7B Vision Instruct", - "display_name": "Qwen 2.5 7B Vision Instruct", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", @@ -106151,361 +113325,401 @@ ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" - }, - { - "id": "qwen/qwen3-embedding-4b", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] + "supported": true, + "default": true, + "budget": { + "default": -1, + "min": 128, + "max": 32768 + } }, - "limit": { - "context": 32000, - "output": 2048 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + 
"summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "search": { + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.01, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, - "type": "embedding" + "type": "chat" }, { - "id": "google/gemma-3", - "name": "Google Gemma 3", - "display_name": "Google Gemma 3", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "display_name": "Gemini 2.5 Flash Preview 04-17", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", 
"cost": { "input": 0.15, - "output": 0.3 + "output": 0.6, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "osmosis/osmosis-structure-0.6b", - "name": "Osmosis Structure 0.6B", - "display_name": "Osmosis Structure 0.6B", + "id": "gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 2048 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-10", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "inception": { - "id": "inception", - "name": "Inception", - "display_name": "Inception", - "api": "https://api.inceptionlabs.ai/v1/", - "doc": "https://platform.inceptionlabs.ai/docs", - "models": [ + }, { - "id": "mercury-edit-2", - "name": "Mercury Edit 2", - "display_name": "Mercury Edit 2", + "id": "gemma-4-31b-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 256000, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", - "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 - }, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "type": "chat" }, { - "id": "mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": "gemini-2.5-pro-preview-tts", + "name": "Gemini 2.5 Pro Preview 
TTS", + "display_name": "Gemini 2.5 Pro Preview TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 128000, - "output": 50000 + "context": 8000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": false, "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 1, + "output": 20 }, "type": "chat" - } - ] - }, - "openai": { - "id": "openai", - "name": "OpenAI", - "display_name": "OpenAI", - "doc": "https://platform.openai.com/docs/models", - "models": [ + }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "display_name": "Gemini 2.5 Flash Preview 05-20", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - 
"verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "gpt-4o-2024-05-13", - "name": "GPT-4o (2024-05-13)", - "display_name": "GPT-4o (2024-05-13)", + "id": "gemini-3.1-flash-image-preview", + "name": "Gemini 3.1 Flash Image (Preview)", + "display_name": "Gemini 3.1 Flash Image (Preview)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2025-01", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 5, - "output": 15 + "input": 0.5, + "output": 60 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "gemini-live-2.5-flash-preview-native-audio", + "name": "Gemini Live 2.5 Flash Preview Native Audio", + "display_name": "Gemini Live 2.5 Flash Preview Native Audio", "modalities": { "input": [ - "text" + 
"text", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 65536 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-09-18", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.5, + "output": 2, + "input_audio": 3, + "output_audio": 12 }, "type": "chat" }, { - "id": "gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "display_name": "Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -106515,37 +113729,37 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": 
"2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 21, - "output": 168 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "gemma-3n-e2b-it", + "name": "Gemma 3n 2B", + "display_name": "Gemma 3n 2B", "modalities": { "input": [ "text" @@ -106555,67 +113769,67 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 8192, + "output": 2000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "attachment": true, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.13, + "input": 0, "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat (latest)", - "display_name": "GPT-5.3 Chat (latest)", + "id": "gemma-3n-e4b-it", + "name": "Gemma 3n 4B", + "display_name": "Gemma 3n 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 2000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": 
"gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "display_name": "Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -106623,10 +113837,10 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -106636,44 +113850,37 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09 2025", + "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", "modalities": { "input": [ "text", @@ -106684,52 +113891,59 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 
24576 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, + "search": { + "supported": true, + "default": false + }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.25, - "output": 2, + "input": 0.1, + "output": 0.4, "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", @@ -106740,56 +113954,66 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": 
true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, + "search": { + "supported": true, + "default": false + }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.05, + "input": 0.1, "output": 0.4, - "cache_read": 0.005 + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -106797,117 +114021,102 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + 
"video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" - }, - { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", - "modalities": { - "input": [ - "text" + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 1536 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2022-12", - "release_date": "2022-12-15", - "last_updated": "2022-12-15", - "cost": { - "input": 0.1, - "output": 0 + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", @@ -106918,67 +114127,49 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 8192 }, - 
"temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "search": { + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -106988,129 +114179,135 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 20, - 
"output": 80 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "gemini-2.5-flash-image-preview", + "name": "Gemini 2.5 Flash Image Preview", + "display_name": "Gemini 2.5 Flash Image Preview", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.3, + "output": 30, + "cache_read": 0.075 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "gemini-2.5-flash-preview-tts", + "name": "Gemini 2.5 Flash Preview TTS", + "display_name": "Gemini 2.5 Flash Preview TTS", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8000, + "output": 16000 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": 
"hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.5, + "output": 10 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "display_name": "Gemini 2.5 Flash Lite Preview 06-17", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -107120,54 +114317,55 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 
3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -107175,123 +114373,103 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "visibility": "hidden" + "summaries": true, 
+ "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 - }, - "type": "chat" - }, - { - "id": "gpt-image-1", - "name": "gpt-image-1", - "display_name": "gpt-image-1", - "modalities": { - "input": [ - "text", - "image" + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", - "type": "imageGeneration" + "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -107299,10 +114477,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -107312,53 +114490,55 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - 
"visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "gemini-live-2.5-flash", + "name": "Gemini Live 2.5 Flash", + "display_name": "Gemini Live 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { "context": 128000, - "output": 16384 + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -107366,20 +114546,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.5, + "output": 2, + "input_audio": 3, + "output_audio": 12 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "gemma-3-12b-it", + "name": "Gemma 3 12B", + "display_name": "Gemma 3 12B", "modalities": { "input": [ "text", @@ -107390,134 +114571,129 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } }, "extra_capabilities": { "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "search": { + "supported": true, + "default": false + }, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + 
"input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "display_name": "Gemini 2.5 Flash Image", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.3, + "output": 30, + "cache_read": 0.075 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", @@ -107528,131 +114704,103 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "search": { + "supported": true, + "default": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-06", + 
"release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-image-1-mini", - "name": "gpt-image-1-mini", - "display_name": "gpt-image-1-mini", + "id": "gemini-1.5-pro", + "name": "Gemini 1.5 Pro", + "display_name": "Gemini 1.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 1000000, "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2025-09-26", - "type": "imageGeneration" + "knowledge": "2024-04", + "release_date": "2024-02-15", + "last_updated": "2024-02-15", + "cost": { + "input": 1.25, + "output": 5, + "cache_read": 0.3125 + }, + "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 2048, + "output": 3072 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": 
{ - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.15, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "gemma-3-4b-it", + "name": "Gemma 3 4B", + "display_name": "Gemma 3 4B", "modalities": { "input": [ "text", @@ -107663,139 +114811,107 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "gemini-1.5-flash-8b", + "name": "Gemini 1.5 Flash-8B", + "display_name": "Gemini 1.5 Flash-8B", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 1000000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + 
"knowledge": "2024-04", + "release_date": "2024-10-03", + "last_updated": "2024-10-03", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 + "input": 0.0375, + "output": 0.15, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "gemini-2.0-flash-preview-image-generation", + "name": "Gemini 2.0 Flash Preview Image Generation", + "display_name": "Gemini 2.0 Flash Preview Image Generation", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "search": { + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", - "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 - }, "type": "chat" - }, + } + ] + }, + "sap-ai-core": { + "id": "sap-ai-core", + "name": "SAP AI Core", + "display_name": "SAP AI Core", + "doc": "https://help.sap.com/docs/sap-ai-core", + "models": [ { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "anthropic--claude-3-opus", + "name": "anthropic--claude-3-opus", + "display_name": "anthropic--claude-3-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -107803,80 +114919,92 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - 
"default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", "cost": { - "input": 0.02, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, - "type": "embedding" + "type": "chat" }, { - "id": "o1-pro", - "name": "o1-pro", - 
"display_name": "o1-pro", + "id": "anthropic--claude-4.5-haiku", + "name": "anthropic--claude-4.5-haiku", + "display_name": "anthropic--claude-4.5-haiku", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -107884,43 +115012,31 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 150, - "output": 600 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "sonar", + "name": "sonar", + "display_name": "sonar", "modalities": { "input": [ "text" @@ -107930,85 +115046,65 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 30, - "output": 60 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "anthropic--claude-3-sonnet", + "name": "anthropic--claude-3-sonnet", + "display_name": "anthropic--claude-3-sonnet", "modalities": { 
"input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "anthropic--claude-3-haiku", + "name": "anthropic--claude-3-haiku", + "display_name": "anthropic--claude-3-haiku", "modalities": { "input": [ "text", @@ -108020,93 +115116,67 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": 
"2026-03-05", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "anthropic--claude-3.5-sonnet", + "name": "anthropic--claude-3.5-sonnet", + "display_name": "anthropic--claude-3.5-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.3-codex-spark", - "name": "GPT-5.3 Codex Spark", - "display_name": "GPT-5.3 Codex Spark", + "id": "anthropic--claude-4.6-sonnet", + "name": "anthropic--claude-4.6-sonnet", + "display_name": "anthropic--claude-4.6-sonnet", "modalities": { "input": [ "text", @@ -108118,115 +115188,104 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - 
"xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "chatgpt-image-latest", - "name": "chatgpt-image-latest", - "display_name": "chatgpt-image-latest", + "id": "gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "anthropic--claude-4.5-sonnet", + "name": "anthropic--claude-4.5-sonnet", + "display_name": "anthropic--claude-4.5-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-07-31", + 
"release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ "text", @@ -108238,98 +115297,70 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "sonar-deep-research", + "name": "sonar-deep-research", + "display_name": "sonar-deep-research", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 128000, + "output": 32768 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + 
"attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "knowledge": "2025-01", + "release_date": "2025-02-01", + "last_updated": "2025-09-01", "cost": { - "input": 15, - "output": 120 + "input": 2, + "output": 8, + "reasoning": 3 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "gemini-2.5-flash-lite", + "name": "gemini-2.5-flash-lite", + "display_name": "gemini-2.5-flash-lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -108337,30 +115368,51 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", "modalities": { "input": [ "text", @@ -108403,83 +115455,78 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", + "knowledge": "2024-05-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.05, + 
"output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "gpt-5.4", + "name": "gpt-5.4", + "display_name": "gpt-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2026-04-27", + "last_updated": "2026-04-27", "cost": { - "input": 1.25, - "output": 10 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "gpt-image-1.5", - "name": "gpt-image-1.5", - "display_name": "gpt-image-1.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-25", - "last_updated": "2025-11-25", - "type": "imageGeneration" - }, - { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "anthropic--claude-4.6-opus", + "name": "anthropic--claude-4.6-opus", + "display_name": "anthropic--claude-4.6-opus", "modalities": { "input": [ "text", @@ -108491,10 +115538,10 @@ ] }, "limit": { 
- "context": 1050000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -108502,23 +115549,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "anthropic--claude-3.7-sonnet", + "name": "anthropic--claude-3.7-sonnet", + "display_name": "anthropic--claude-3.7-sonnet", "modalities": { "input": [ "text", @@ -108530,34 +115575,58 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-10-31", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": 
"gemini-2.5-flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -108565,30 +115634,52 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-06-05", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ "text", @@ -108606,16 +115697,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -108631,106 +115722,69 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.25, + "output": 2, + "cache_read": 0.025 
}, "type": "chat" }, { - "id": "gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "anthropic--claude-4-sonnet", + "name": "anthropic--claude-4-sonnet", + "display_name": "anthropic--claude-4-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-image-2", - "name": "gpt-image-2", - "display_name": "gpt-image-2", + "id": "anthropic--claude-4.5-opus", + "name": "anthropic--claude-4.5-opus", + "display_name": "anthropic--claude-4.5-opus", "modalities": { "input": [ "text", - "image" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 5, - "output": 30, - "cache_read": 1.25 - }, - "type": "imageGeneration" - } - ] - }, - "requesty": { - "id": "requesty", - "name": "Requesty", - "display_name": "Requesty", - "api": "https://router.requesty.ai/v1", - "doc": "https://requesty.ai/solution/llm-routing/models", - "models": [ - { - "id": "xai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", - "modalities": { - "input": [ - "text" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 
2000000, + "context": 200000, "output": 64000 }, "temperature": true, @@ -108741,21 +115795,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-05", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05, - "cache_write": 0.2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "sonar-pro", + "name": "sonar-pro", + "display_name": "sonar-pro", "modalities": { "input": [ "text", @@ -108766,127 +115820,103 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-09", - "last_updated": "2025-09-09", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 3 + "output": 15 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-Max", - "display_name": "GPT-5.1-Codex-Max", + "id": "anthropic--claude-4.7-opus", + "name": "anthropic--claude-4.7-opus", + "display_name": "anthropic--claude-4.7-opus", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": 
"effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "anthropic--claude-4-opus", + "name": "anthropic--claude-4-opus", + "display_name": "anthropic--claude-4-opus", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.25, - "output": 10 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", @@ -108911,11 +115941,12 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ + "minimal", + "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -108928,19 +115959,29 @@ }, 
"attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 21, - "output": 168 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" - }, + } + ] + }, + "scaleway": { + "id": "scaleway", + "name": "Scaleway", + "display_name": "Scaleway", + "api": "https://api.scaleway.ai/v1", + "doc": "https://www.scaleway.com/en/docs/generative-apis/", + "models": [ { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "pixtral-12b-2409", + "name": "Pixtral 12B 2409", + "display_name": "Pixtral 12B 2409", "modalities": { "input": [ "text", @@ -108952,163 +115993,90 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2024-09-25", + "last_updated": "2026-03-17", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral Small 3.2 24B Instruct (2506)", + "display_name": "Mistral Small 3.2 24B Instruct (2506)", "modalities": { "input": [ - "text" + "text", + "image" ], 
"output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-20", + "last_updated": "2026-03-17", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3-Codex", - "display_name": "GPT-5.3-Codex", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": true, + 
"release_date": "2024-07-25", + "last_updated": "2026-03-17", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "display_name": "Gemma-3-27B-IT", "modalities": { "input": [ "text", @@ -109119,77 +116087,74 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 40000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2026-03-17", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.25, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "bge-multilingual-gemma2", + "name": "BGE Multilingual Gemma2", + "display_name": "BGE Multilingual Gemma2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2024-07-26", + "last_updated": "2025-06-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4 Mini", - "display_name": "o4 Mini", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B 
A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -109200,159 +116165,135 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "open_weights": 
true, + "release_date": "2025-07-01", + "last_updated": "2026-03-17", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "display_name": "GPT-5.1-Codex-Mini", + "id": "qwen3-embedding-8b", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 100000 + "context": 32768, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": false, + "release_date": "2025-25-11", + "last_updated": "2026-03-17", + "cost": { + "input": 0.1, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2026-03-17", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.003, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-image", - "name": 
"GPT-5 Image", - "display_name": "GPT-5 Image", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 8196 }, "temperature": true, "tool_call": true, @@ -109360,355 +116301,240 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-10-14", - "last_updated": "2025-10-14", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2026-03-17", "cost": { - "input": 5, - "output": 10, - "cache_read": 1.25 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 260000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": 
"2026-03-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.75, + "output": 2.25 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2026-03-17", "cost": { - "input": 30, - "output": 180, - "cache_read": 30 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 100000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - 
"effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2026-03-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "audio", - "image", - "video" + "text" ], "output": [ - "text", - "audio", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2024-01-01", + "last_updated": "2026-03-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "devstral-2-123b-instruct-2512", + "name": "Devstral 2 123B Instruct (2512)", + "display_name": "Devstral 2 123B 
Instruct (2512)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-07", + "last_updated": "2026-03-17", "cost": { "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2026-03-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.2, + "output": 0.2 }, "type": "chat" - }, + } + ] + }, + "opencode": { + "id": "opencode", + "name": "OpenCode Zen", + "display_name": "OpenCode Zen", + "api": "https://opencode.ai/zen/v1", + "doc": 
"https://opencode.ai/docs/zen", + "models": [ { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -109719,53 +116545,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 1 + "input": 0.3, + "output": 1.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -109777,51 +116592,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - 
"knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "cache_write": 4.5 + "input": 0.6, + "output": 3, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -109833,38 +116639,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.55 + "input": 0.2, + "output": 1.2, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", + "id": "claude-haiku-4-5", "name": "Claude Haiku 4.5", "display_name": "Claude Haiku 4.5", "modalities": { @@ -109879,7 +116676,7 @@ }, "limit": { "context": 200000, - "output": 62000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -109894,7 +116691,7 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-01", + "knowledge": "2025-02-28", "release_date": "2025-10-15", "last_updated": 
"2025-10-15", "cost": { @@ -109906,180 +116703,107 @@ "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "anthropic/claude-3-7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "kimi-k2.5-free", + "name": "Kimi K2.5 Free", + "display_name": "Kimi K2.5 Free", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - }, - { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - 
"reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "gemini-3-pro", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -110087,8 +116811,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -110096,125 +116820,53 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - }, - { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "interleaved": true, 
"summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 + "input": 4, + "output": 18, + "cache_read": 0.4 } }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5.2", + "id": "gpt-5.2", "name": "GPT-5.2", "display_name": "GPT-5.2", "modalities": { @@ -110271,76 +116923,59 @@ "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "glm-5-free", + "name": "GLM-5 Free", + "display_name": "GLM-5 Free", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 204800, + "output": 131072 }, - 
"temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -110348,20 +116983,27 @@ }, "limit": { "context": 400000, - "output": 272000 + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -110373,59 +117015,63 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - 
"last_updated": "2025-10-06", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 15, - "output": 120 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "minimax-m2.1-free", + "name": "MiniMax M2.1 Free", + "display_name": "MiniMax M2.1 Free", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -110433,10 +117079,10 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -110444,87 +117090,81 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - 
"thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31, - "cache_write": 2.375, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ 
"text", @@ -110536,7 +117176,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -110545,36 +117185,58 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { "input": 3, "output": 15, "cache_read": 0.3, - "cache_write": 3.75 + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "mimo-v2-flash-free", + "name": "MiMo V2 Flash Free", + "display_name": "MiMo V2 Flash Free", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "limit": { - "context": 1000000, - "output": 64000 + "limit": { + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -110584,40 +117246,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0 }, 
"type": "chat" - } - ] - }, - "digitalocean": { - "id": "digitalocean", - "name": "DigitalOcean", - "display_name": "DigitalOcean", - "api": "https://inference.do-ai.run/v1", - "doc": "https://docs.digitalocean.com/products/gradient-ai-platform/details/models/", - "models": [ + }, { - "id": "openai-gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "gpt-5.3-codex-spark", + "name": "GPT-5.3 Codex Spark", + "display_name": "GPT-5.3 Codex Spark", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -110625,29 +117281,51 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-08-31", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "multi-qa-mpnet-base-dot-v1", - "name": "Multi-QA-mpnet-base-dot-v1", - "display_name": "Multi-QA-mpnet-base-dot-v1", + "id": "trinity-large-preview-free", + "name": "Trinity Large Preview", + "display_name": "Trinity Large Preview", "modalities": { "input": [ "text" @@ -110657,28 +117335,29 @@ ] }, "limit": { - "context": 512, - "output": 768 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + 
"tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2021-08-30", - "last_updated": "2026-04-16", + "knowledge": "2025-06", + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "cost": { - "input": 0.009, + "input": 0, "output": 0 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "deepseek-v4-flash-free", + "name": "DeepSeek V4 Flash Free", + "display_name": "DeepSeek V4 Flash Free", "modalities": { "input": [ "text" @@ -110688,10 +117367,10 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -110710,54 +117389,76 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-04-16", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.5, - "output": 2.7 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "nemotron-3-nano-omni", - "name": "Nemotron Nano 3 Omni", - "display_name": "Nemotron Nano 3 Omni", + "id": "gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - 
"open_weights": true, - "release_date": "2026-04-28", - "last_updated": "2026-04-30", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.5, - "output": 0.9 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, "type": "chat" }, { - "id": "llama3-8b-instruct", - "name": "Llama 3.1 Instruct (8B)", - "display_name": "Llama 3.1 Instruct (8B)", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -110767,103 +117468,98 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.198, - "output": 0.198 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "anthropic-claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "mimo-v2-pro-free", + "name": "MiMo V2 Pro Free", + "display_name": "MiMo V2 Pro Free", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - 
"medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "anthropic-claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -110871,60 +117567,27 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 + "extra_capabilities": { + "reasoning": { + "supported": true } }, - "type": "chat" - }, - { - "id": "wan2-2-t2v-a14b", - "name": "Wan2.2-T2V-A14B", - "display_name": "Wan2.2-T2V-A14B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "video" - ] - }, - "limit": { - "context": 100, - "output": 1 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - 
"supported": false - }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2026-04-30", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { "input": 0.6, - "output": 0 + "output": 2.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen-2.5-14b-instruct", - "name": "Qwen 2.5 14B Instruct", - "display_name": "Qwen 2.5 14B Instruct", + "id": "ling-2.6-flash-free", + "name": "Ling 2.6 Flash Free", + "display_name": "Ling 2.6 Flash Free", "modalities": { "input": [ "text" @@ -110934,8 +117597,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262100, + "output": 32800 }, "temperature": true, "tool_call": true, @@ -110944,15 +117607,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "knowledge": "2025-06", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "openai-gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", @@ -110965,30 +117632,57 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility 
path." + ] + } }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 2.5, + "input": 3, "output": 15, - "cache_read": 0.25 + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen 3.5 397B A17B", - "display_name": "Qwen 3.5 397B A17B", + "id": "glm-4.7-free", + "name": "GLM-4.7 Free", + "display_name": "GLM-4.7 Free", "modalities": { "input": [ "text" @@ -110998,8 +117692,8 @@ ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -111020,54 +117714,67 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-04-30", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.55, - "output": 3.5 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai-o3", - "name": "o3", - "display_name": "o3", + "id": "qwen3.6-plus-free", + "name": "Qwen3.6 Plus Free", + "display_name": "Qwen3.6 Plus Free", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 2, - "output": 8, - 
"cache_read": 0.5 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "e5-large-v2", - "name": "E5 Large v2", - "display_name": "E5 Large v2", + "id": "minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ "text" @@ -111077,74 +117784,131 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 + }, + "type": "chat" + }, + { + "id": "qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-05-19", - "last_updated": "2026-04-30", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.02, - "output": 0 + "input": 0.45, + "output": 1.8 }, "type": "chat" }, { - "id": "openai-gpt-5.2-pro", - "name": "GPT-5.2 pro", - "display_name": "GPT-5.2 pro", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": 
true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 21, - "output": 168 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 128000 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -111161,20 +117925,23 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-04-16", + "attachment": true, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 1, - "output": 3.2 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "openai-gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -111192,83 +117959,101 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, 
"open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 - }, - "type": "chat" - }, - { - "id": "mistral-7b-instruct-v0.3", - "name": "Mistral 7B Instruct v0.3", - "display_name": "Mistral 7B Instruct v0.3", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, - "attachment": false, - "open_weights": true, - "release_date": "2024-05-22", - "last_updated": "2024-05-22", "type": "chat" }, { - "id": "llama3.3-70b-instruct", - "name": "Llama 3.3 Instruct 70B", - "display_name": "Llama 3.3 Instruct 70B", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.65, - "output": 0.65 + "input": 0.05, + "output": 0.4, + 
"cache_read": 0.005 }, "type": "chat" }, { - "id": "mistral-3-14B", - "name": "Ministral 3 14B Instruct", - "display_name": "Ministral 3 14B Instruct", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -111279,64 +118064,99 @@ }, "limit": { "context": 262144, - "output": 128000 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-15", - "last_updated": "2026-04-30", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-30", - "last_updated": 
"2025-01-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.99, - "output": 0.99 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "alibaba-qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "hy3-preview-free", + "name": "Hy3 preview Free", + "display_name": "Hy3 preview Free", "modalities": { "input": [ "text" @@ -111346,8 +118166,8 @@ ] }, "limit": { - "context": 131000, - "output": 40960 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -111357,18 +118177,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-30", - "last_updated": "2026-04-16", + "knowledge": "2025-06", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.25, - "output": 0.55 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "anthropic-claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -111380,20 +118202,44 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking 
control and should not be treated as a thinking budget." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { "input": 5, "output": 25, @@ -111403,13 +118249,15 @@ "type": "chat" }, { - "id": "openai-o1", - "name": "o1", - "display_name": "o1", + "id": "gemini-3-flash", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -111417,97 +118265,89 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "anthropic-claude-3-opus", - "name": "Claude 3 Opus", - "display_name": "Claude 3 Opus", + "id": "minimax-m2.5-free", + "name": "MiniMax M2.5 Free", + "display_name": "MiniMax M2.5 Free", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, 
- "open_weights": false, - "knowledge": "2023-08", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - }, - { - "id": "stable-diffusion-3.5-large", - "name": "Stable Diffusion 3.5 Large", - "display_name": "Stable Diffusion 3.5 Large", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 256, - "output": 1 + "supported": true, + "default": true }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-10-22", - "last_updated": "2026-04-30", + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.08, - "output": 0 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai-gpt-5-nano", - "name": "GPT-5 nano", - "display_name": "GPT-5 nano", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", @@ -111525,57 +118365,45 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 - }, - "type": "chat" - }, - { - "id": "llama-4-maverick", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "default": false }, - "attachment": true, - "open_weights": true, - "knowledge": 
"2024-08", - "release_date": "2025-04-05", - "last_updated": "2026-04-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.25, - "output": 0.87 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "anthropic-claude-4.5-sonnet", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", @@ -111587,38 +118415,51 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 - } + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, { - "id": "qwen3-embedding-0.6b", - "name": "Qwen3 Embedding 0.6B", - 
"display_name": "Qwen3 Embedding 0.6B", + "id": "big-pickle", + "name": "Big Pickle", + "display_name": "Big Pickle", "modalities": { "input": [ "text" @@ -111628,39 +118469,55 @@ ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 200000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-03", - "last_updated": "2026-04-16", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-10-17", + "last_updated": "2025-10-17", "cost": { - "input": 0.04, - "output": 0 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "anthropic-claude-4.5-haiku", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -111671,90 +118528,133 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1, - "output": 5, - "cache_read": 1, - "cache_write": 1.25 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 
6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "gte-large-en-v1.5", - "name": "GTE Large (v1.5)", - "display_name": "GTE Large (v1.5)", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-27", - "last_updated": "2026-04-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.09, - "output": 0 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, "type": "chat" }, { - "id": "openai-gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 2, - "output": 
8, - "cache_read": 0.5 + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 }, "type": "chat" }, { - "id": "anthropic-claude-3.5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "claude-3-5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -111769,11 +118669,11 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-11-05", - "last_updated": "2024-11-05", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { "input": 0.8, "output": 4, @@ -111783,13 +118683,14 @@ "type": "chat" }, { - "id": "openai-gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -111805,11 +118706,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { "input": 1.75, "output": 14, @@ -111818,9 +118740,9 @@ "type": "chat" }, { - "id": "deepseek-3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "grok-code", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -111830,8 +118752,8 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + 
"context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -111839,60 +118761,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-02", - "last_updated": "2026-04-30", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-20", + "last_updated": "2025-08-20", "cost": { - "input": 0.5, - "output": 1.6 - }, - "type": "chat" - }, - { - "id": "nemotron-3-nano-30b", - "name": "Nemotron 3 Nano 30B A3B", - "display_name": "Nemotron 3 Nano 30B A3B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", "type": "chat" }, { - "id": "anthropic-claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", @@ -111904,32 +118788,52 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, 
"attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai-gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "ring-2.6-1t-free", + "name": "Ring 2.6 1T Free", + "display_name": "Ring 2.6 1T Free", "modalities": { "input": [ "text" @@ -111939,8 +118843,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -111948,53 +118852,32 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-08-05", - "last_updated": "2026-04-16", - "cost": { - "input": 0.05, - "output": 0.45 - }, - "type": "chat" - }, - { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2026-04-30", + "knowledge": "2025-06", + "release_date": "2026-05-08", + "last_updated": "2026-05-08", "cost": { - "input": 0.45, - "output": 1.7 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai-o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "nemotron-3-super-free", + "name": 
"Nemotron 3 Super Free", + "display_name": "Nemotron 3 Super Free", "modalities": { "input": [ "text" @@ -112004,31 +118887,42 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai-gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -112038,7 +118932,7 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, @@ -112060,63 +118954,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-08-05", - "last_updated": "2026-04-16", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.1, - "output": 0.7 + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gemma-4-31B-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 256000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": 
true, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-30", - "cost": { - "input": 0.18, - "output": 0.5 - }, - "type": "chat" - }, - { - "id": "nemotron-nano-12b-v2-vl", - "name": "Nemotron Nano 12B v2 VL", - "display_name": "Nemotron Nano 12B v2 VL", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -112124,25 +118986,39 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-12-01", - "last_updated": "2026-04-30", + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.2, - "output": 0.6 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "anthropic-claude-4.1-opus", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "gemini-3.1-pro", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -112150,8 +119026,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -112159,16 +119035,48 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - 
"release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, @@ -112179,7 +119087,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -112187,9 +119096,9 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -112208,47 +119117,68 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", + "knowledge": "2024-10", "release_date": "2026-04-21", "last_updated": "2026-04-21", "cost": { "input": 0.95, - "output": 4 + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai-gpt-image-2", - "name": "GPT Image 2", - "display_name": "GPT Image 2", + "id": "mimo-v2-omni-free", + "name": "MiMo V2 Omni Free", + "display_name": "MiMo V2 Omni Free", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", + "open_weights": true, + 
"knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "anthropic-claude-4.6-sonnet", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -112260,7 +119190,7 @@ ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 64000 }, "temperature": true, @@ -112269,29 +119199,28 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai-gpt-5-mini", - "name": "GPT-5 mini", - "display_name": "GPT-5 mini", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -112311,22 +119240,43 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", + "knowledge": "2024-09-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 1.07, + 
"output": 8.5, + "cache_read": 0.107 }, "type": "chat" }, { - "id": "anthropic-claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", @@ -112338,45 +119288,84 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1, - "output": 5, - "cache_read": 1, - "cache_write": 1.25 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -112385,169 +119374,171 @@ "extra_capabilities": { "reasoning": { "supported": 
true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.74, - "output": 3.48 - }, - "type": "chat" - }, - { - "id": "ministral-3-8b-instruct-2512", - "name": "Ministral 3 8B", - "display_name": "Ministral 3 8B", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } ] }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, + "context": 1000000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + 
"default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2026-02-12", - "last_updated": "2026-04-16", - "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" - }, - { - "id": "openai-gpt-image-1", - "name": "GPT Image 1", - "display_name": "GPT Image 1", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, "attachment": true, "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { "input": 5, - "output": 40, - "cache_read": 1.25 + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" - }, + } + ] + }, + "mixlayer": { + "id": "mixlayer", + "name": "Mixlayer", + "display_name": "Mixlayer", + "api": "https://models.mixlayer.ai/v1", + "doc": "https://docs.mixlayer.com", + "models": [ { - "id": "openai-gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B A10B", + "display_name": "Qwen3.5 122B A10B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - 
"attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-30", - "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.4, + "output": 3.2 + }, "type": "chat" }, { - "id": "nvidia-nemotron-3-super-120b", - "name": "Nemotron-3-Super-120B", - "display_name": "Nemotron-3-Super-120B", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text" @@ -112556,9 +119547,9 @@ "text" ] }, - "limit": { - "context": 256000, - "output": 32768 + "limit": { + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -112566,55 +119557,74 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-04-16", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.3, - "output": 0.65 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "openai-gpt-5.4-pro", - "name": "GPT-5.4 pro", - "display_name": "GPT-5.4 pro", + "id": "qwen/qwen3.5-9b", + "name": "Qwen3.5 9B", + "display_name": "Qwen3.5 9B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": 
false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 30, - "output": 180 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "all-mini-lm-l6-v2", - "name": "All-MiniLM-L6-v2", - "display_name": "All-MiniLM-L6-v2", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5 35B A3B", + "display_name": "Qwen3.5 35B A3B", "modalities": { "input": [ "text" @@ -112624,28 +119634,40 @@ ] }, "limit": { - "context": 256, - "output": 384 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2021-08-30", - "last_updated": "2026-04-16", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.009, - "output": 0 + "input": 0.25, + "output": 1.3 }, "type": "chat" }, { - "id": "bge-m3", - "name": "BGE M3", - "display_name": "BGE M3", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ "text" @@ -112655,28 +119677,49 @@ ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + 
"tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-01-30", - "last_updated": "2026-04-30", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.02, - "output": 0 + "input": 0.3, + "output": 2.4 }, - "type": "embedding" - }, + "type": "chat" + } + ] + }, + "perplexity-agent": { + "id": "perplexity-agent", + "name": "Perplexity Agent", + "display_name": "Perplexity Agent", + "api": "https://api.perplexity.ai/v1", + "doc": "https://docs.perplexity.ai/docs/agent-api/models", + "models": [ { - "id": "openai-gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -112694,39 +119737,60 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic-claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "openai/gpt-5.1", + 
"name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -112736,97 +119800,108 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 0.5, - "cache_write": 6.25 - } + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai-gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": 
true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { "input": 2.5, - "output": 10, - "cache_read": 1.25 + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "openai-gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -112835,22 +119910,43 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai-gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -112870,22 +119966,43 @@ "supported": true, "default": true }, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", + "knowledge": "2024-05-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "arcee-trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super 120B", + "display_name": "Nemotron 3 Super 120B", "modalities": { "input": [ "text" @@ -112895,8 +120012,8 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 1000000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -112906,113 +120023,106 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-16", + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { "input": 0.25, - "output": 0.9, - "cache_read": 0.06 + "output": 2.5 }, "type": "chat" }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral Nemo Instruct", - "display_name": "Mistral Nemo Instruct", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-18", 
- "last_updated": "2024-07-18", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.3, - "output": 0.3 + "input": 1, + "output": 5, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-03-24", - "type": "chat" - }, - { - "id": "bge-reranker-v2-m3", - "name": "BGE Reranker v2 M3", - "display_name": "BGE Reranker v2 M3", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 1 + "supported": true, + "default": true }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-12", - "last_updated": "2026-04-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.01, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3 }, - "type": "rerank" + "type": "chat" }, { - "id": "anthropic-claude-3.7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 
4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -113032,99 +120142,104 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", + "mode": "mixed", "budget": { "min": 1024, "unit": "tokens" }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic uses thinking budget tokens" + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { "input": 3, "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - }, - { - "id": "qwen3-tts-voicedesign", - "name": "Qwen3 TTS VoiceDesign", - "display_name": "Qwen3 TTS VoiceDesign", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 32768, - "output": 1 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "cache_read": 0.3 }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-30", "type": "chat" }, { - "id": "openai-gpt-image-1.5", - "name": "GPT Image 1.5", - "display_name": "GPT Image 1.5", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { "input": 5, - "output": 10, - "cache_read": 1 + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai-gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", @@ -113136,35 +120251,62 @@ ] }, "limit": { - "context": 400000, + "context": 200000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", + "knowledge": "2025-05-31", "release_date": "2026-02-05", "last_updated": "2026-02-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "anthropic-claude-3.5-sonnet", - "name": "Claude 3.5 Sonnet", - "display_name": "Claude 3.5 Sonnet", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -113172,290 +120314,310 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-06-20", - "last_updated": "2024-10-22", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - }, - { - "id": "fal-ai/fast-sdxl", - "name": "Fast SDXL", - "display_name": "Fast SDXL", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2023-07-26", - "last_updated": "2026-04-16", - "type": "chat" - }, - { - "id": "fal-ai/flux/schnell", - "name": "FLUX.1 [schnell]", - "display_name": "FLUX.1 [schnell]", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, 
- "attachment": false, - "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2026-04-16", - "type": "chat" - }, - { - "id": "fal-ai/elevenlabs/tts/multilingual-v2", - "name": "ElevenLabs Multilingual TTS v2", - "display_name": "ElevenLabs Multilingual TTS v2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "input": 5, + "output": 25, + "cache_read": 0.5 }, - "attachment": false, - "open_weights": false, - "release_date": "2023-08-22", - "last_updated": "2026-04-16", "type": "chat" }, { - "id": "fal-ai/stable-audio-25/text-to-audio", - "name": "Stable Audio 2.5 (Text-to-Audio)", - "display_name": "Stable Audio 2.5 (Text-to-Audio)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-10-08", - "last_updated": "2026-04-16", - "type": "chat" - } - ] - }, - "vultr": { - "id": "vultr", - "name": "Vultr", - "display_name": "Vultr", - "api": "https://api.vultrinference.com/v1", - "doc": "https://api.vultrinference.com/", - "models": [ - { - "id": "MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 194000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": 
"budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2025-02-11", - "last_updated": "2025-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "GLM-5-FP8", - "name": "GLM 5 FP8", - "display_name": "GLM 5 FP8", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.85, - "output": 3.1 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ 
+ { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.55, - "output": 1.65 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "tiers": [ + { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 0.5, + "output": 3, + "cache_read": 0.05 + } }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 
129000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03 }, "type": "chat" }, - { - "id": "Kimi-K2.5", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + { + "id": "perplexity/sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ "text" @@ -113465,79 +120627,69 @@ ] }, "limit": { - "context": 254000, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.55, - "output": 2.75 + "input": 0.25, + "output": 2.5, + "cache_read": 0.0625 }, "type": "chat" - } - ] - }, - "alibaba-coding-plan-cn": { - "id": "alibaba-coding-plan-cn", - "name": "Alibaba 
Coding Plan (China)", - "display_name": "Alibaba Coding Plan (China)", - "api": "https://coding.dashscope.aliyuncs.com/v1", - "doc": "https://help.aliyun.com/zh/model-studio/coding-plan", - "models": [ + }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "xai/grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" - }, + } + ] + }, + "alibaba-coding-plan": { + "id": "alibaba-coding-plan", + "name": "Alibaba Coding Plan", + "display_name": "Alibaba Coding Plan", + "api": "https://coding-intl.dashscope.aliyuncs.com/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/coding-plan", + "models": [ { "id": "kimi-k2.5", "name": "Kimi K2.5", @@ -113545,7 +120697,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -113586,20 +120739,22 @@ "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, 
@@ -113619,10 +120774,10 @@ } }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { "input": 0, "output": 0, @@ -113632,9 +120787,9 @@ "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -113644,30 +120799,18 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { "input": 0, "output": 0, @@ -113677,20 +120820,22 @@ "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 24576 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -113710,9 +120855,10 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { "input": 0, "output": 0, @@ -113722,22 +120868,20 @@ "type": "chat" }, { - "id": "qwen3.6-plus", 
- "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 196608, + "output": 24576 }, "temperature": true, "tool_call": true, @@ -113757,10 +120901,9 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { "input": 0, "output": 0, @@ -113815,9 +120958,9 @@ "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -113827,18 +120970,31 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { "input": 0, "output": 0, @@ -113848,21 +121004,20 @@ "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -113883,9 
+121038,8 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { "input": 0, "output": 0, @@ -113893,130 +121047,22 @@ "cache_write": 0 }, "type": "chat" - } - ] - }, - "mistral": { - "id": "mistral", - "name": "Mistral", - "display_name": "Mistral", - "doc": "https://docs.mistral.ai/getting-started/models/", - "models": [ - { - "id": "mistral-small-latest", - "name": "Mistral Small (latest)", - "display_name": "Mistral Small (latest)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", - "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", - "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - 
"attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", - "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" - }, - { - "id": "labs-devstral-small-2512", - "name": "Devstral Small 2", - "display_name": "Devstral Small 2", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -114025,51 +121071,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", - "cost": { - "input": 0.4, - "output": 2 + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "meganova": { + "id": "meganova", + "name": "Meganova", + "display_name": "Meganova", + "api": "https://api.meganova.ai/v1", + "doc": "https://docs.meganova.ai", + "models": [ { - "id": "magistral-medium-latest", - "name": "Magistral Medium (latest)", - "display_name": "Magistral Medium (latest)", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -114079,30 +121104,41 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 163840, + "output": 64000 }, "temperature": 
true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 2, - "output": 5 + "input": 0.5, + "output": 2.15 }, "type": "chat" }, { - "id": "open-mixtral-8x7b", - "name": "Mixtral 8x7B", - "display_name": "Mixtral 8x7B", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -114112,8 +121148,8 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -114122,52 +121158,49 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-01", - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "release_date": "2025-08-25", + "last_updated": "2025-08-25", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "pixtral-large-latest", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "release_date": "2025-03-24", + "last_updated": 
"2025-03-24", "cost": { - "input": 2, - "output": 6 + "input": 0.25, + "output": 0.88 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral Large 2.1", - "display_name": "Mistral Large 2.1", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -114177,8 +121210,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -114187,19 +121220,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "release_date": "2025-10-10", + "last_updated": "2025-10-10", "cost": { - "input": 2, - "output": 6 + "input": 0.27, + "output": 0.4 }, "type": "chat" }, { - "id": "codestral-latest", - "name": "Codestral (latest)", - "display_name": "Codestral (latest)", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -114209,33 +121241,36 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.26, + "output": 0.38 }, "type": "chat" }, { - "id": "mistral-large-latest", - "name": "Mistral Large (latest)", - "display_name": "Mistral Large (latest)", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -114248,56 +121283,35 @@ 
"temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", - "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" - }, - { - "id": "mistral-small-2506", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.6, + "output": 2.6 }, "type": "chat" }, { - "id": "pixtral-12b", - "name": "Pixtral 12B", - "display_name": "Pixtral 12B", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -114308,92 +121322,41 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", - "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" - }, - { - "id": "ministral-8b-latest", - "name": "Ministral 8B (latest)", - "display_name": "Ministral 8B (latest)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 
128000, - "output": 128000 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", - "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" - }, - { - "id": "mistral-embed", - "name": "Mistral Embed", - "display_name": "Mistral Embed", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8000, - "output": 3072 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.1, - "output": 0 + "input": 0.45, + "output": 2.8 }, "type": "chat" }, { - "id": "magistral-small", - "name": "Magistral Small", - "display_name": "Magistral Small", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -114403,8 +121366,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -114412,33 +121375,43 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", 
"cost": { - "input": 0.5, - "output": 1.5 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "mistral-small-2603", - "name": "Mistral Small 4", - "display_name": "Mistral Small 4", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -114446,21 +121419,31 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.8, + "output": 2.56 }, "type": "chat" }, { - "id": "ministral-3b-latest", - "name": "Ministral 3B (latest)", - "display_name": "Ministral 3B (latest)", + "id": "zai-org/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -114470,29 +121453,41 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.45, + 
"output": 1.9 }, "type": "chat" }, { - "id": "open-mixtral-8x22b", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ "text" @@ -114502,8 +121497,8 @@ ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -114512,19 +121507,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2, - "output": 6 + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "mistral-medium-2604", - "name": "Mistral Medium 3.5", - "display_name": "Mistral Medium 3.5", + "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24B Instruct", + "display_name": "Mistral Small 3.2 24B Instruct", "modalities": { "input": [ "text", @@ -114535,29 +121529,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "knowledge": "2024-10", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "devstral-small-2505", - "name": "Devstral Small 2505", - "display_name": "Devstral Small 2505", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -114567,8 +121561,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 16384 }, 
"temperature": true, "tool_call": true, @@ -114577,9 +121571,8 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { "input": 0.1, "output": 0.3 @@ -114587,9 +121580,9 @@ "type": "chat" }, { - "id": "devstral-medium-2507", - "name": "Devstral Medium", - "display_name": "Devstral Medium", + "id": "XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ "text" @@ -114599,29 +121592,30 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2024-12-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.4, - "output": 2 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "open-mistral-7b", - "name": "Mistral 7B", - "display_name": "Mistral 7B", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ "text" @@ -114631,29 +121625,40 @@ ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 196608, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2023-09-27", - "last_updated": "2023-09-27", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - 
"input": 0.25, - "output": 0.25 + "input": 0.28, + "output": 1.2 }, "type": "chat" }, { - "id": "devstral-medium-latest", - "name": "Devstral 2 (latest)", - "display_name": "Devstral 2 (latest)", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -114663,62 +121668,87 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.4, - "output": 2 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "Qwen/Qwen3.5-Plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2025-04", + "release_date": "2026-02", + "last_updated": "2026-02", "cost": { "input": 0.4, - 
"output": 2 + "output": 2.4, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "devstral-small-2507", - "name": "Devstral Small", - "display_name": "Devstral Small", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -114728,8 +121758,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -114738,52 +121768,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", - "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" - }, - { - "id": "mistral-medium-2508", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.4, - "output": 2 + "input": 0.09, + "output": 0.6 }, "type": "chat" }, { - "id": "mistral-medium-latest", - "name": "Mistral Medium (latest)", - "display_name": "Mistral Medium (latest)", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ "text", @@ -114794,38 +121790,37 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + 
"release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.2, + "output": 0.6 }, "type": "chat" } ] }, - "ovhcloud": { - "id": "ovhcloud", - "name": "OVHcloud AI Endpoints", - "display_name": "OVHcloud AI Endpoints", - "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", - "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", + "synthetic": { + "id": "synthetic", + "name": "Synthetic", + "display_name": "Synthetic", + "api": "https://api.synthetic.new/openai/v1", + "doc": "https://synthetic.new/pricing", "models": [ { - "id": "meta-llama-3_3-70b-instruct", - "name": "Meta-Llama-3_3-70B-Instruct", - "display_name": "Meta-Llama-3_3-70B-Instruct", + "id": "hf:deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -114835,28 +121830,41 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.74, - "output": 0.74 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "mistral-7b-instruct-v0.3", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "hf:deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 (0528)", + "display_name": "DeepSeek R1 (0528)", "modalities": { "input": [ "text" @@ -114866,28 +121874,40 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 128000 }, 
"temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "open_weights": false, + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.11, - "output": 0.11 + "input": 3, + "output": 8 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "hf:deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -114897,8 +121917,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -114906,63 +121926,52 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", + "open_weights": false, + "release_date": "2025-09-22", + "last_updated": "2025-09-25", "cost": { - "input": 0.09, - "output": 0.25 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", + "id": "hf:deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + 
"tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", + "attachment": false, + "open_weights": false, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 1.01, - "output": 1.01 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen3-Coder-30B-A3B-Instruct", + "id": "hf:deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 (0324)", + "display_name": "DeepSeek V3 (0324)", "modalities": { "input": [ "text" @@ -114972,8 +121981,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -114981,19 +121990,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "open_weights": false, + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.07, - "output": 0.26 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "hf:deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -115003,9 +122012,10 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 162816, + "output": 8000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -115018,54 +122028,56 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.05, - "output": 0.18 + "input": 0.27, + "output": 0.4, + "cache_read": 0.27, + "cache_write": 0 }, "type": "chat" }, { - "id": 
"mistral-small-3.2-24b-instruct-2506", - "name": "Mistral-Small-3.2-24B-Instruct-2506", - "display_name": "Mistral-Small-3.2-24B-Instruct-2506", + "id": "hf:deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.1, - "output": 0.31 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "qwen3.5-9b", - "name": "Qwen3.5-9B", - "display_name": "Qwen3.5-9B", + "id": "hf:moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -115078,7 +122090,8 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -115091,32 +122104,35 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2025-11", + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "cost": { - "input": 0.1, - "output": 0.15 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "hf:moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + 
"output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -115124,23 +122140,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.09, - "output": 0.47 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral-Nemo-Instruct-2407", - "display_name": "Mistral-Nemo-Instruct-2407", + "id": "hf:moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -115150,8 +122173,8 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -115160,18 +122183,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.14, - "output": 0.14 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "hf:Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -115181,37 +122205,41 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + 
"summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-11", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.65, + "output": 3 }, "type": "chat" - } - ] - }, - "friendli": { - "id": "friendli", - "name": "Friendli", - "display_name": "Friendli", - "api": "https://api.friendli.ai/serverless/v1", - "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", - "models": [ + }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "hf:Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen 3 235B Instruct", + "display_name": "Qwen 3 235B Instruct", "modalities": { "input": [ "text" @@ -115221,8 +122249,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -115231,29 +122259,31 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2026-01-29", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "cost": { "input": 0.2, - "output": 0.8 + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "hf:Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-97B-A17B", + "display_name": "Qwen3.5-97B-A17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -115274,19 +122304,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "release_date": "2026-02-11", + "last_updated": 
"2026-02-11", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.6, + "output": 3, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "hf:Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -115296,41 +122326,29 @@ ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-10", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.5 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ "text" @@ -115340,8 +122358,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -115350,18 +122368,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2025-12-23", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.6, - "output": 0.6 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B 
Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "hf:openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -115371,18 +122390,24 @@ ] }, "limit": { - "context": 131072, - "output": 8000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2025-12-23", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { "input": 0.1, "output": 0.1 @@ -115390,9 +122415,9 @@ "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "hf:zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -115402,8 +122427,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -115424,28 +122449,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.55, + "output": 2.19 }, "type": "chat" - } - ] - }, - "cortecs": { - "id": "cortecs", - "name": "Cortecs", - "display_name": "Cortecs", - "api": "https://api.cortecs.ai/v1", - "doc": "https://api.cortecs.ai/v1/models", - "models": [ + }, { - "id": "minimax-m2.7", - "name": "MiniMax-m2.7", - "display_name": "MiniMax-m2.7", + "id": "hf:zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -115455,8 +122471,8 @@ ] }, "limit": { - "context": 202752, - "output": 196072 + "context": 196608, + "output": 
65536 }, "temperature": true, "tool_call": true, @@ -115477,31 +122493,30 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-01-18", + "last_updated": "2026-01-18", "cost": { - "input": 0.47, - "output": 1.4 + "input": 0.06, + "output": 0.4, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "hf:zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -115511,70 +122526,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "cost": { - "input": 1.09, - "output": 5.43 - }, - "type": "chat" - }, - { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 131000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2026-02-12", + "last_updated": "2026-04-08", "cost": { - "input": 0.062, - "output": 0.408 + "input": 1, + "output": 3, + "cache_read": 1 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": 
"hf:zai-org/GLM-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -115595,19 +122581,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2026-03-27", + "last_updated": "2026-04-12", "cost": { - "input": 0.55, - "output": 2.76 + "input": 1, + "output": 3, + "cache_read": 1 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "hf:zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -115617,29 +122603,35 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.551, - "output": 1.654 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "hf:nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-NVFP4", + "name": "Nemotron 3 Super 120B", + "display_name": "Nemotron 3 Super 120B", "modalities": { "input": [ "text" @@ -115649,8 +122641,8 @@ ] }, "limit": { - "context": 198000, - "output": 198000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -115671,67 +122663,32 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", 
- "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-04", + "release_date": "2026-03-11", + "last_updated": "2026-04-03", "cost": { - "input": 0.45, - "output": 2.23 + "input": 0.3, + "output": 1, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "claude-opus4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "hf:nvidia/Kimi-K2.5-NVFP4", + "name": "Kimi K2.5 (NVFP4)", + "display_name": "Kimi K2.5 (NVFP4)", "modalities": { "input": [ "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 5.6, - "output": 27.99, - "cache_read": 0.56, - "cache_write": 6.99 - }, - "type": "chat" - }, - { - "id": "glm-5", - "name": "GLM 5", - "display_name": "GLM 5", - "modalities": { - "input": [ - "text" + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -115752,51 +122709,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", - "cost": { - "input": 1.08, - "output": 3.44 - }, - "type": "chat" - }, - { - "id": "nova-pro-v1", - "name": "Nova Pro 1.0", - "display_name": "Nova Pro 1.0", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 300000, - "output": 5000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2025-01", + "release_date": "2026-01", + 
"last_updated": "2026-01", "cost": { - "input": 1.016, - "output": 4.061 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "devstral-2512", - "name": "Devstral 2 2512", - "display_name": "Devstral 2 2512", + "id": "hf:MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -115806,29 +122731,40 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "hf:MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -115838,13 +122774,14 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 191488, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -115859,19 +122796,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "release_date": "2026-02-07", + "last_updated": "2026-02-07", "cost": { - "input": 0.099, - "output": 0.33 + "input": 0.6, + "output": 3, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "codestral-2508", - "name": "Codestral 2508", - "display_name": "Codestral 2508", 
+ "id": "hf:MiniMaxAI/MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -115881,43 +122818,45 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 196608, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.03 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "claude-4-5-sonnet", - "name": "Claude 4.5 Sonnet", - "display_name": "Claude 4.5 Sonnet", + "id": "hf:meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -115925,53 +122864,54 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 3.259, - "output": 16.296 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama-4-Scout-17B-16E-Instruct", + "display_name": "Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - 
"context": 131000, - "output": 131000 + "context": 328000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-07-11", - "last_updated": "2025-09-05", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.551, - "output": 2.646 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super 120B A12B", - "display_name": "Nemotron 3 Super 120B A12B", + "id": "hf:meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama-3.1-70B-Instruct", + "display_name": "Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -115981,8 +122921,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -115992,19 +122932,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.266, - "output": 0.799 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "hf:meta-llama/Llama-3.1-405B-Instruct", + "name": "Llama-3.1-405B-Instruct", + "display_name": "Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -116014,8 +122954,8 @@ ] }, "limit": { - "context": 400000, - "output": 400000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -116023,98 +122963,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, 
"open_weights": true, - "knowledge": "2024-11", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.39, - "output": 1.57 + "input": 3, + "output": 3 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "hf:meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 1048576, - "output": 65535 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-17", - "cost": { - "input": 1.654, - "output": 11.024 - }, - "type": "chat" - }, - { - "id": "claude-opus4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", - "modalities": { - "input": [ - "text", - "image", - "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -116122,21 +122996,21 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 5.98, - "output": 29.89 + 
"input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "devstral-small-2512", - "name": "Devstral Small 2 2512", - "display_name": "Devstral Small 2 2512", + "id": "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ "text", @@ -116147,40 +123021,41 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 524000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0, - "output": 0 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "minimax-m2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "hf:moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196000, - "output": 196000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -116199,31 +123074,42 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.34, - "output": 1.34 + "input": 0.95, + "output": 4, + "cache_read": 0.95 }, "type": "chat" - }, + } + ] + }, + "azure": { + "id": "azure", + "name": "Azure", + "display_name": "Azure", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + 
"display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -116244,30 +123130,32 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-14", - "last_updated": "2026-04-14", + "knowledge": "2025-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 1.31, - "output": 4.1, - "cache_read": 0.24 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -116277,78 +123165,67 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.67, - "output": 2.46 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "claude-opus4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 8191, + 
"output": 3072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 5.98, - "output": 29.89 + "input": 0.13, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -116357,19 +123234,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 3.307, - "output": 16.536 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ "text" @@ -116379,41 +123256,30 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": 
false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.164, - "output": 1.311 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ "text" @@ -116423,75 +123289,64 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.22, - "output": 1.34 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2023-10", + 
"release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.81, - "output": 3.54, - "cache_read": 0.2 + "input": 0.08, + "output": 0.32, + "input_audio": 4 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next 80B", - "display_name": "Qwen3 Coder Next 80B", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -116501,97 +123356,119 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.158, - "output": 0.84 + "input": 5.33, + "output": 16 }, "type": "chat" }, { - "id": "claude-4-6-sonnet", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 3.59, - "output": 17.92 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B 
Instruct", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.441, - "output": 1.984 + "input": 1.75, + "output": 14, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "mixtral-8x7B-instruct-v0.1", - "name": "Mixtral 8x7B Instruct v0.1", - "display_name": "Mixtral 8x7B Instruct v0.1", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ "text" @@ -116601,30 +123478,29 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.438, - "output": 0.68 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": 
"hermes-4-70b", - "name": "Hermes 4 70B", - "display_name": "Hermes 4 70B", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -116635,29 +123511,28 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, "knowledge": "2023-12", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.116, - "output": 0.358 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -116667,11 +123542,11 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -116689,56 +123564,52 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.32, - "output": 1.18 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.266, - "output": 0.444 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "intellect-3", - "name": "INTELLECT 3", - "display_name": "INTELLECT 3", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ "text" @@ -116749,29 +123620,44 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-26", - "last_updated": "2025-11-26", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.219, - "output": 1.202 + "input": 16.5, + "output": 66, + "cache_read": 8.25 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -116781,110 +123667,122 @@ ] }, "limit": { - "context": 203000, - "output": 203000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - 
"default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "open_weights": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.09, - "output": 0.53 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "gpt-oss-120b", - "name": "GPT Oss 120b", - "display_name": "GPT Oss 120b", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-01", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", 
"modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 0.062, - "output": 0.231 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { "id": "deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -116894,8 +123792,8 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -116920,27 +123818,26 @@ "release_date": "2025-05-28", "last_updated": "2025-05-28", "cost": { - "input": 0.585, - "output": 2.307 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT 4.1", - "display_name": "GPT 4.1", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -116948,20 +123845,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 2.354, - 
"output": 9.417 + "input": 1.14, + "output": 4.56 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ "text" @@ -116971,41 +123868,28 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.656, - "output": 2.731 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.1-405b-instruct", - "name": "Llama 3.1 405B Instruct", - "display_name": "Llama 3.1 405B Instruct", + "id": "deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "display_name": "DeepSeek-V3.2-Speciale", "modalities": { "input": [ "text" @@ -117019,25 +123903,26 @@ "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0, - "output": 0 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "qwen3.5-122b-a10b", - "name": "Qwen3.5 122B A10B", - "display_name": "Qwen3.5 122B A10B", + "id": 
"phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ "text" @@ -117047,41 +123932,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.444, - "output": 3.106 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ "text" @@ -117091,108 +123964,100 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.089, - "output": 0.275 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3 2512", - "display_name": "Mistral Large 3 2512", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - 
"text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-12", + "knowledge": "2024-07", "release_date": "2025-12-01", "last_updated": "2025-12-01", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0.05 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 250000, - "output": 250000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ "text" @@ -117202,42 +124067,29 
@@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.133, - "output": 0.266, - "cache_read": 0.028 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -117247,53 +124099,42 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.553, - "output": 3.106, - "cache_read": 0.145 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 
4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -117301,30 +124142,28 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.053, - "output": 0.222 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" - } - ] - }, - "siliconflow-com": { - "id": "siliconflow-com", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.com/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ + }, { - "id": "nex-agi/DeepSeek-V3.1-Nex-N1", - "name": "nex-agi/DeepSeek-V3.1-Nex-N1", - "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -117334,118 +124173,107 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.5, - "output": 2 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "id": 
"phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Thinking", - "name": "Qwen/Qwen3-VL-32B-Thinking", - "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", "cost": { - "input": 0.2, - "output": 1.5 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + 
"display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 131000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -117454,103 +124282,111 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.09, - "output": 0.3 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + 
"release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.45, - "output": 3.5 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.05, - "output": 0.05 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -117560,28 +124396,29 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-11-11", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": 
"Qwen/Qwen3-VL-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ "text", @@ -117592,28 +124429,27 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "release_date": "2025-05-19", + "last_updated": "2025-11-18", "cost": { - "input": 0.29, - "output": 1 + "input": 0.14, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -117623,40 +124459,29 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-06", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { "input": 0.15, - "output": 0.58 + "output": 0.6 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen/Qwen3-235B-A22B", - "display_name": "Qwen/Qwen3-235B-A22B", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ "text" @@ -117666,114 +124491,91 @@ ] }, "limit": { - "context": 131000, - 
"output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.35, - "output": 1.42 + "input": 0.16, + "output": 0.64 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Thinking", - "name": "Qwen/Qwen3-VL-8B-Thinking", - "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8191, + "output": 1536 }, - "temperature": true, - 
"tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.18, - "output": 2 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", @@ -117784,8 +124586,8 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -117793,92 +124595,95 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.05, - "output": 0.05 + "input": 0.2, + "output": 0.78 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, 
"open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.06, - "output": 0.06 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -117888,28 +124693,29 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": 
"2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.09, - "output": 0.3 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ "text" @@ -117919,134 +124725,177 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-11-25", + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 0.09, - "output": 0.6 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - 
"release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.14, - "output": 0.57 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-11-25", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "id": "mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + 
"supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -118056,13 +124905,14 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -118076,50 +124926,54 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": 
"2024-09-25", "cost": { - "input": 0.59, - "output": 0.59 + "input": 2.04, + "output": 2.04 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ "text" @@ -118129,41 +124983,45 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-19", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 0.18, - "output": 0.18 + "input": 1.5, + "output": 6, + "cache_read": 0.375 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -118172,105 +125030,96 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", 
"cost": { - "input": 0.13, - "output": 0.6 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { "input": 0.1, - "output": 0.4 + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-11-25", + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 0.27, - "output": 0.27 + "input": 3, + 
"output": 4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -118280,8 +125129,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -118289,63 +125138,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-14B-Instruct", - "name": "Qwen/Qwen2.5-14B-Instruct", - "display_name": "Qwen/Qwen2.5-14B-Instruct", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ "text" @@ -118355,28 +125162,30 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 256000, + "output": 8000 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", @@ -118387,104 +125196,93 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-11-25", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.29, - "output": 1 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Instruct", - "name": "Qwen/Qwen3-VL-32B-Instruct", - "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": 
"2025-11-25", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.2, - "output": 0.6 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Instruct", - "name": "Qwen/Qwen3-VL-8B-Instruct", - "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.18, - "output": 0.68 + "input": 0.3, + "output": 0.61 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -118494,8 +125292,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -118503,50 +125301,53 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.25, - "output": 1 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", + 
"id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.37, + "output": 0.37 }, "type": "chat" }, { - "id": "stepfun-ai/Step-3.5-Flash", - "name": "stepfun-ai/Step-3.5-Flash", - "display_name": "stepfun-ai/Step-3.5-Flash", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ "text" @@ -118556,29 +125357,29 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5", - "name": "zai-org/GLM-4.5", - "display_name": "zai-org/GLM-4.5", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -118588,8 +125389,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -118598,76 +125399,92 @@ 
}, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.4, - "output": 2 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "zai-org/GLM-5V-Turbo", - "name": "zai-org/GLM-5V-Turbo", - "display_name": "zai-org/GLM-5V-Turbo", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 1.2, - "output": 4, - "cache_write": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "zai-org/GLM-4.7", - "display_name": "zai-org/GLM-4.7", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 400000, + "output": 128000 }, - 
"temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -118676,28 +125493,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.6, - "output": 2.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "zai-org/GLM-5.1", - "display_name": "zai-org/GLM-5.1", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ "text" @@ -118707,72 +125536,64 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.4, - "output": 4.4, - "cache_write": 0 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "zai-org/GLM-4.5-Air", - "display_name": "zai-org/GLM-4.5-Air", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 
Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.14, - "output": 0.86 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "zai-org/GLM-5", - "display_name": "zai-org/GLM-5", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -118782,40 +125603,29 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1, - "output": 3.2 + "input": 0.3, + "output": 0.61 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "zai-org/GLM-4.6V", - "display_name": "zai-org/GLM-4.6V", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -118826,65 +125636,108 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 272000, + "output": 
128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-12-07", - "last_updated": "2025-12-07", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "zai-org/GLM-4.6", - "display_name": "zai-org/GLM-4.6", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.5, - "output": 1.9 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5V", - "name": "zai-org/GLM-4.5V", - "display_name": 
"zai-org/GLM-4.5V", + "id": "gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", @@ -118895,59 +125748,31 @@ ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.86 - }, - "type": "chat" - }, - { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 33000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-23", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.06, - "output": 0.06 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", + "id": "grok-4-20-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ "text" @@ -118957,8 +125782,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -118973,80 +125798,100 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "knowledge": "2025-09", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.14, - "output": 
0.57 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", - "cost": { - "input": 0.07, - "output": 0.28 - }, - "type": "chat" - }, - { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 131000 + "supported": true, + "default": false }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.14, - "output": 0.57 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -119056,8 +125901,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -119065,19 +125910,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.71, + "output": 0.71 }, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "grok-4-20-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ "text" @@ -119087,28 +125933,34 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 262000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + 
"supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2025-09", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "deepseek-ai/DeepSeek-V3.1", - "display_name": "deepseek-ai/DeepSeek-V3.1", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text" @@ -119118,29 +125970,45 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 128000, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.27, - "output": 1 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ "text", @@ -119151,59 +126019,63 @@ ] }, "limit": { - "context": 4000, - "output": 4000 + "context": 128000, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-04-15", + "last_updated": 
"2025-04-15", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "deepseek-ai/DeepSeek-V3", - "display_name": "deepseek-ai/DeepSeek-V3", + "id": "gpt-5.3-chat", + "name": "GPT-5.3 Chat", + "display_name": "GPT-5.3 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.25, - "output": 1 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -119213,8 +126085,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -119223,30 +126095,32 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "deepseek-ai/DeepSeek-R1", - "display_name": "deepseek-ai/DeepSeek-R1", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + 
"display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -119257,39 +126131,36 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "interleaved": true } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.5, - "output": 2.18 + "input": 0.95, + "output": 4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -119297,63 +126168,40 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" - }, - { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 164000, - "output": 164000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - 
"attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-10", - "last_updated": "2025-11-25", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.27, - "output": 0.41 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "deepseek-ai/DeepSeek-V3.2", - "display_name": "deepseek-ai/DeepSeek-V3.2", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -119366,125 +126214,171 @@ "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.27, - "output": 0.42 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + 
"medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.27, - "output": 1 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "openai/gpt-oss-20b", - "display_name": "openai/gpt-oss-20b", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.04, - "output": 0.18 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "openai/gpt-oss-120b", - "display_name": "openai/gpt-oss-120b", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + 
"verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.05, - "output": 0.45 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" @@ -119494,8 +126388,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -119503,188 +126397,274 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.28, - "output": 1.1 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.086, - "output": 0.086 + "input": 2, + "output": 8, + 
"cache_read": 0.5 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.086, - "output": 0.086 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.27, - "output": 0.27 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - 
"release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "moonshotai/Kimi-K2-Thinking", - "display_name": "moonshotai/Kimi-K2-Thinking", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.55, - "output": 2.5 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "moonshotai/Kimi-K2.6", - "display_name": "moonshotai/Kimi-K2.6", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { 
"input": [ "text", @@ -119695,72 +126675,63 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "moonshotai/Kimi-K2-Instruct", - "display_name": "moonshotai/Kimi-K2-Instruct", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-13", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.58, - "output": 2.29 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "moonshotai/Kimi-K2-Instruct-0905", - "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -119770,8 +126741,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + 
"output": 4000 }, "temperature": true, "tool_call": true, @@ -119779,226 +126750,323 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.4, - "output": 2 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "moonshotai/Kimi-K2.5", - "display_name": "moonshotai/Kimi-K2.5", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.45, - "output": 2.25 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMaxAI/MiniMax-M2.5", - "display_name": "MiniMaxAI/MiniMax-M2.5", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - 
"text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMaxAI/MiniMax-M2.1", - "display_name": "MiniMaxAI/MiniMax-M2.1", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2025-12-01", + "release_date": 
"2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 1.2 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.21, - "output": 0.57 + "input": 30, + "output": 180, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" - } - ] - }, - "vercel": { - "id": "vercel", - "name": "Vercel AI Gateway", - "display_name": "Vercel AI Gateway", - "doc": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway", - "models": [ + }, { - "id": 
"alibaba/qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1, - "output": 5 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-27b", - "name": "Qwen 3.6 27B", - "display_name": "Qwen 3.6 27B", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -120007,28 +127075,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-05-01", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.6, - "output": 3.5999999999999996 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "alibaba/qwen3-embedding-8b", - 
"name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -120038,61 +127111,103 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 100000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.05, - "output": 0 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, - "type": "embedding" + "type": "chat" }, { - "id": "alibaba/qwen-3-30b", - "name": "Qwen3-30B-A3B", - "display_name": "Qwen3-30B-A3B", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.08, - "output": 0.29 + "input": 2, + "output": 8, + 
"cache_read": 0.5 }, "type": "chat" - }, + } + ] + }, + "minimax-coding-plan": { + "id": "minimax-coding-plan", + "name": "MiniMax Token Plan (minimax.io)", + "display_name": "MiniMax Token Plan (minimax.io)", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/token-plan/intro", + "models": [ { - "id": "alibaba/qwen-3-235b", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -120102,42 +127217,45 @@ ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "alibaba/qwen3.5-flash", - "name": "Qwen 3.5 Flash", - "display_name": "Qwen 3.5 Flash", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -120156,35 +127274,33 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.001, - "cache_write": 0.125 + "input": 0, + "output": 0, + 
"cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -120194,31 +127310,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-03", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.09999999999999999, - "cache_write": 0.625 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "alibaba/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -120228,13 +127338,14 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -120248,20 +127359,21 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.2, - "output": 6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": 
"chat" }, { - "id": "alibaba/qwen3-embedding-0.6b", - "name": "Qwen3 Embedding 0.6B", - "display_name": "Qwen3 Embedding 0.6B", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" @@ -120271,28 +127383,36 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.01, - "output": 0 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "alibaba/qwen-3-32b", - "name": "Qwen 3.32B", - "display_name": "Qwen 3.32B", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -120302,8 +127422,8 @@ ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -120311,34 +127431,45 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "upstage": { + "id": "upstage", + "name": "Upstage", + "display_name": "Upstage", + "api": "https://api.upstage.ai/v1/solar", + "doc": 
"https://developers.upstage.ai/docs/apis/chat", + "models": [ { - "id": "alibaba/qwen-3.6-max-preview", - "name": "Qwen 3.6 Max Preview", - "display_name": "Qwen 3.6 Max Preview", + "id": "solar-pro2", + "name": "solar-pro2", + "display_name": "solar-pro2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 240000, - "output": 64000 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -120346,22 +127477,21 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-24", + "attachment": false, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.26, - "cache_write": 1.625 + "input": 0.25, + "output": 0.25 }, "type": "chat" }, { - "id": "alibaba/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "solar-mini", + "name": "solar-mini", + "display_name": "solar-mini", "modalities": { "input": [ "text" @@ -120371,45 +127501,32 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-06-12", + "last_updated": "2025-04-22", "cost": { "input": 0.15, - "output": 1.5 + "output": 0.15 }, "type": "chat" }, { - "id": "alibaba/qwen3-vl-thinking", - "name": 
"Qwen3 VL Thinking", - "display_name": "Qwen3 VL Thinking", + "id": "solar-pro3", + "name": "solar-pro3", + "display_name": "solar-pro3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -120417,7 +127534,48 @@ }, "limit": { "context": 131072, - "output": 129024 + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2026-01", + "last_updated": "2026-01", + "cost": { + "input": 0.25, + "output": 0.25 + }, + "type": "chat" + } + ] + }, + "amazon-bedrock": { + "id": "amazon-bedrock", + "name": "Amazon Bedrock", + "display_name": "Amazon Bedrock", + "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", + "models": [ + { + "id": "zai.glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -120436,21 +127594,21 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.7, - "output": 8.4 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "alibaba/qwen3-235b-a22b-thinking", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "global.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (Global)", + "display_name": "Claude Sonnet 4.5 (Global)", "modalities": { "input": [ "text", @@ -120462,8 +127620,8 @@ ] }, "limit": { - "context": 262114, - "output": 262114 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -120471,32 +127629,23 @@ 
"supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.3, - "output": 2.9 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "alibaba/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "qwen.qwen3-235b-a22b-2507-v1:0", + "name": "Qwen3 235B A22B 2507", + "display_name": "Qwen3 235B A22B 2507", "modalities": { "input": [ "text" @@ -120507,7 +127656,7 @@ }, "limit": { "context": 262144, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -120516,19 +127665,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.09, - "output": 1.1 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "zai.glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -120538,8 +127687,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 202752, + "output": 101376 }, "temperature": true, "tool_call": true, @@ -120547,51 +127696,66 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, 
"attachment": false, - "open_weights": false, - "release_date": "2025-07-22", - "last_updated": "2026-02-19", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.5, - "output": 1.2 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "alibaba/qwen3-embedding-4b", - "name": "Qwen3 Embedding 4B", - "display_name": "Qwen3 Embedding 4B", + "id": "amazon.nova-pro-v1:0", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 300000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.02, - "output": 0 + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 }, - "type": "embedding" + "type": "chat" }, { - "id": "alibaba/qwen3-max-thinking", - "name": "Qwen 3 Max Thinking", - "display_name": "Qwen 3 Max Thinking", + "id": "openai.gpt-oss-20b-1:0", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -120601,74 +127765,65 @@ ] }, "limit": { - "context": 256000, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "context": 128000, + "output": 16384 }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01", - 
"last_updated": "2025-01", + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 0.07, + "output": 0.3 }, "type": "chat" }, { - "id": "alibaba/qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "us.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (US)", + "display_name": "Claude Haiku 4.5 (US)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-09-24", - "last_updated": "2026-05-01", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "writer.palmyra-x4-v1:0", + "name": "Palmyra X4", + "display_name": "Palmyra X4", "modalities": { "input": [ "text" @@ -120678,29 +127833,29 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 122880, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.38, - "output": 1.53 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": 
"alibaba/qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "moonshot.kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -120710,154 +127865,136 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "interleaved": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "alibaba/qwen3.5-plus", - "name": "Qwen 3.5 Plus", - "display_name": "Qwen 3.5 Plus", + "id": "mistral.ministral-3-8b-instruct", + "name": "Ministral 3 8B", + "display_name": "Ministral 3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-16", - "last_updated": "2026-02-19", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04, - "cache_write": 0.5 + 
"input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "alibaba/qwen-3-14b", - "name": "Qwen3-14B", - "display_name": "Qwen3-14B", + "id": "meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct", + "display_name": "Llama 4 Scout 17B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, + "context": 3500000, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.06, - "output": 0.24 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "alibaba/qwen3-vl-instruct", - "name": "Qwen3 VL Instruct", - "display_name": "Qwen3 VL Instruct", + "id": "us.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (US)", + "display_name": "Claude Opus 4.5 (US)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.7, - "output": 2.8 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder-30b-a3b", - "name": "Qwen 3 Coder 30B A3B Instruct", - "display_name": "Qwen 3 Coder 30B A3B Instruct", + "id": 
"qwen.qwen3-coder-480b-a35b-v1:0", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -120867,30 +128004,29 @@ ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.07, - "output": 0.27 + "input": 0.22, + "output": 1.8 }, "type": "chat" }, { - "id": "perplexity/sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "google.gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "display_name": "Google Gemma 3 27B Instruct", "modalities": { "input": [ "text", @@ -120901,8 +128037,8 @@ ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 202752, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -120910,86 +128046,88 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", "cost": { - "input": 3, - "output": 15 + "input": 0.12, + "output": 0.2 }, "type": "chat" }, { - "id": "perplexity/sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "mistral.ministral-3-14b-instruct", + "name": "Ministral 14B 3.0", + "display_name": "Ministral 14B 3.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - 
"attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 1, - "output": 1 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning", - "name": "Sonar Reasoning", - "display_name": "Sonar Reasoning", + "id": "us.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (US)", + "display_name": "Claude Sonnet 4.5 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1, - "output": 5 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "qwen.qwen3-coder-30b-a3b-v1:0", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -120999,70 +128137,90 @@ ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 262144, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": 
"2025-09-18", "cost": { - "input": 2, - "output": 8 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-thinking", - "name": "DeepSeek V3.2 Thinking", - "display_name": "DeepSeek V3.2 Thinking", + "id": "anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.03 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "zai.glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -121072,8 +128230,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -121082,64 +128240,66 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.27, + "input": 0.07, "output": 0.4 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "google.gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.3, - "output": 1 + "input": 
0.049999999999999996, + "output": 0.09999999999999999 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (Global)", + "display_name": "Claude Opus 4.5 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -121147,35 +128307,28 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-23", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "au.anthropic.claude-sonnet-4-6", + "name": "AU Anthropic Claude Sonnet 4.6", + "display_name": "AU Anthropic Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -121183,78 +128336,89 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + 
], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-23", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 3.3, + "output": 16.5, + "cache_read": 0.33, + "cache_write": 4.125 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "qwen.qwen3-vl-235b-a22b", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163842, - "output": 8000 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.22 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "meta.llama3-3-70b-instruct-v1:0", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -121264,8 +128428,8 @@ ] }, "limit": { - "context": 163840, - "output": 16384 + "context": 128000, + "output": 4096 }, 
"temperature": true, "tool_call": true, @@ -121273,20 +128437,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.77, - "output": 0.77 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "nvidia.nemotron-nano-9b-v2", + "name": "NVIDIA Nemotron Nano 9B v2", + "display_name": "NVIDIA Nemotron Nano 9B v2", "modalities": { "input": [ "text" @@ -121296,117 +128460,134 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.27, - "output": 1 + "input": 0.06, + "output": 0.23 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "us.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (US)", + "display_name": "Claude Opus 4.7 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + 
"high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.35, - "output": 5.4 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "nvidia.nemotron-nano-12b-v2", + "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "display_name": "NVIDIA Nemotron Nano 12B v2 VL BF16", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12", - "last_updated": "2025-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.05, - "output": 0.15 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262100, - "output": 80000 + "context": 
200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -121414,20 +128595,23 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-03", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.25, - "output": 0.8999999999999999 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-preview", - "name": "Trinity Large Preview", - "display_name": "Trinity Large Preview", + "id": "deepseek.v3-v1:0", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -121437,114 +128621,124 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 163840, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-01", - "last_updated": "2025-01", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.25, - "output": 1 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "recraft/recraft-v3", - "name": "Recraft V3", - "display_name": "Recraft V3", + "id": "meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct", + "display_name": "Llama 4 Maverick 17B Instruct", "modalities": { "input": [ - "text" - ], - "output": [ + "text", "image" - ] - }, - "limit": { - "context": 512, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-10", - "last_updated": "2024-10", - "type": "chat" - }, - { - "id": "recraft/recraft-v2", - "name": 
"Recraft V2", - "display_name": "Recraft V2", - "modalities": { - "input": [ - "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 1000000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-03", - "last_updated": "2024-03", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.24, + "output": 0.97 + }, "type": "chat" }, { - "id": "voyage/voyage-3-large", - "name": "voyage-3-large", - "display_name": "voyage-3-large", + "id": "eu.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (EU)", + "display_name": "Claude Opus 4.7 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1000000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.18, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "voyage/voyage-4-large", - "name": "voyage-4-large", - "display_name": "voyage-4-large", + "id": "qwen.qwen3-32b-v1:0", + "name": "Qwen3 32B (dense)", + "display_name": "Qwen3 32B (dense)", "modalities": { "input": [ "text" @@ -121554,86 +128748,65 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", - "type": "chat" - }, - { - "id": "voyage/voyage-3.5-lite", - "name": "voyage-3.5-lite", - "display_name": "voyage-3.5-lite", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 1536 - }, - "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.02, - "output": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "voyage/voyage-code-3", - "name": "voyage-code-3", - "display_name": "voyage-code-3", + "id": "amazon.nova-lite-v1:0", + "name": "Nova Lite", + "display_name": "Nova Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 300000, + "output": 8192 }, - 
"temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.18, - "output": 0 + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "voyage/voyage-finance-2", - "name": "voyage-finance-2", - "display_name": "voyage-finance-2", + "id": "mistral.devstral-2-123b", + "name": "Devstral 2 123B", + "display_name": "Devstral 2 123B", "modalities": { "input": [ "text" @@ -121643,55 +128816,65 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 256000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-03", - "last_updated": "2024-03", + "open_weights": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.12, - "output": 0 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "voyage/voyage-4-lite", - "name": "voyage-4-lite", - "display_name": "voyage-4-lite", + "id": "eu.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (EU)", + "display_name": "Claude Opus 4.5 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": 
"2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "voyage/voyage-4", - "name": "voyage-4", - "display_name": "voyage-4", + "id": "openai.gpt-oss-120b-1:0", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -121701,24 +128884,28 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.15, + "output": 0.6 + }, "type": "chat" }, { - "id": "voyage/voyage-code-2", - "name": "voyage-code-2", - "display_name": "voyage-code-2", + "id": "deepseek.r1-v1:0", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -121728,123 +128915,130 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.12, - "output": 0 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "voyage/voyage-law-2", - "name": "voyage-law-2", - "display_name": "voyage-law-2", + "id": "mistral.mistral-large-3-675b-instruct", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 256000, + "output": 8192 }, - "temperature": false, - 
"tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-03", - "last_updated": "2024-03", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.12, - "output": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "voyage/voyage-3.5", - "name": "voyage-3.5", - "display_name": "voyage-3.5", + "id": "mistral.magistral-small-2509", + "name": "Magistral Small 1.2", + "display_name": "Magistral Small 1.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 40000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.06, - "output": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "morph/morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "mistral.pixtral-large-2502-v1:0", + "name": "Pixtral Large (25.02)", + "display_name": "Pixtral Large (25.02)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-04-08", + "last_updated": "2025-04-08", "cost": { - "input": 0.9, - "output": 1.9 + "input": 2, + "output": 6 }, "type": "chat" 
}, { - "id": "morph/morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "mistral.voxtral-mini-3b-2507", + "name": "Voxtral Mini 3B 2507", + "display_name": "Voxtral Mini 3B 2507", "modalities": { "input": [ + "audio", "text" ], "output": [ @@ -121852,41 +129046,39 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "zai/glm-5v-turbo", - "name": "GLM 5V Turbo", - "display_name": "GLM 5V Turbo", + "id": "writer.palmyra-x5-v1:0", + "name": "Palmyra X5", + "display_name": "Palmyra X5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1040000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -121894,21 +129086,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-03", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.6, + "output": 6 }, "type": "chat" }, { - "id": "zai/glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "minimax.minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ "text" @@ -121918,8 +129109,8 @@ ] }, "limit": { - "context": 202752, - "output": 120000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -121927,33 +129118,20 @@ "supported": true, "default": 
true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.43, - "output": 1.75, - "cache_read": 0.08 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "zai/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen.qwen3-next-80b-a3b", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -121963,126 +129141,128 @@ ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-19", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "zai/glm-4.7-flashx", - "name": "GLM 4.7 FlashX", - "display_name": "GLM 4.7 FlashX", + "id": "au.anthropic.claude-opus-4-6-v1", + "name": "AU Anthropic Claude Opus 4.6", + "display_name": "AU Anthropic Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - 
"default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01", - "last_updated": "2025-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.06, - "output": 0.4, - "cache_read": 0.01 + "input": 16.5, + "output": 82.5, + "cache_read": 1.65, + "cache_write": 20.625 }, "type": "chat" }, { - "id": "zai/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "meta.llama3-1-8b-instruct-v1:0", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-07", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.22, + "output": 0.22 }, "type": "chat" }, { - "id": "zai/glm-4.6v-flash", - "name": "GLM-4.6V-Flash", - 
"display_name": "GLM-4.6V-Flash", + "id": "amazon.nova-2-lite-v1:0", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" @@ -122090,36 +129270,39 @@ }, "limit": { "context": 128000, - "output": 24000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.33, + "output": 2.75 + }, "type": "chat" }, { - "id": "zai/glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "moonshotai.kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -122135,19 +129318,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { "input": 0.6, - "output": 2.2 + "output": 3 }, "type": "chat" }, { - "id": "zai/glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "nvidia.nemotron-super-3-120b", + "name": "NVIDIA Nemotron 3 Super 120B A12B", + "display_name": "NVIDIA Nemotron 3 Super 120B A12B", "modalities": { "input": [ "text" @@ -122157,8 +129339,8 @@ ] }, "limit": { - "context": 128000, - "output": 96000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -122168,19 +129350,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + 
"release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0.2, - "output": 1.1 + "input": 0.15, + "output": 0.65 }, "type": "chat" }, { - "id": "zai/glm-5-turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "qwen.qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -122190,8 +129371,8 @@ ] }, "limit": { - "context": 202800, - "output": 131100 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -122199,26 +129380,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-17", + "open_weights": true, + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.22, + "output": 1.8 }, "type": "chat" }, { - "id": "zai/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "mistral.ministral-3-3b-instruct", + "name": "Ministral 3 3B", + "display_name": "Ministral 3 3B", "modalities": { "input": [ "text", @@ -122229,33 +129404,33 @@ ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "zai/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "eu.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (EU)", + "display_name": "Claude Haiku 4.5 (EU)", "modalities": { 
"input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -122263,7 +129438,7 @@ }, "limit": { "context": 200000, - "output": 96000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -122271,40 +129446,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.45, - "output": 1.8 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "zai/glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "minimax.minimax-m2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 24000 + "context": 204608, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -122312,22 +129481,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { "input": 0.3, - "output": 0.9, - "cache_read": 0.05 + "output": 1.2 }, "type": "chat" }, { - "id": "zai/glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "meta.llama3-1-70b-instruct-v1:0", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ "text" @@ -122337,34 +129504,29 @@ ] }, "limit": { - "context": 200000, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.07, - "output": 0.39999999999999997 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "cohere/command-a", - "name": "Command A", - "display_name": "Command A", + "id": "openai.gpt-oss-safeguard-120b", + "name": "GPT OSS Safeguard 120B", + "display_name": "GPT OSS Safeguard 120B", "modalities": { "input": [ "text" @@ -122374,8 +129536,8 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -122384,50 +129546,55 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 2.5, - "output": 10 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "cohere/embed-v4.0", - "name": "Embed v4.0", - "display_name": "Embed v4.0", + "id": "global.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (Global)", + "display_name": "Claude Haiku 4.5 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + 
"last_updated": "2025-10-15", "cost": { - "input": 0.12, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "prime-intellect/intellect-3", - "name": "INTELLECT 3", - "display_name": "INTELLECT 3", + "id": "amazon.nova-micro-v1:0", + "name": "Nova Micro", + "display_name": "Nova Micro", "modalities": { "input": [ "text" @@ -122437,30 +129604,30 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-11-26", - "last_updated": "2025-11-26", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.2, - "output": 1.1 + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 }, "type": "chat" }, { - "id": "xai/grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -122472,8 +129639,8 @@ ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -122481,26 +129648,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-05-01", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.19999999999999998 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xai/grok-4.20-non-reasoning", - "name": "Grok 4.20 Non-Reasoning", - "display_name": "Grok 4.20 Non-Reasoning", + "id": 
"eu.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (EU)", + "display_name": "Claude Sonnet 4.5 (EU)", "modalities": { "input": [ "text", @@ -122512,42 +129676,44 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xai/grok-4.20-non-reasoning-beta", - "name": "Grok 4.20 Beta Non-Reasoning", - "display_name": "Grok 4.20 Beta Non-Reasoning", + "id": "mistral.voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ "text", - "image", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -122555,33 +129721,30 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "xai/grok-4.20-reasoning", - "name": "Grok 4.20 Reasoning", - "display_name": "Grok 4.20 Reasoning", + "id": "nvidia.nemotron-nano-3-30b", + "name": "NVIDIA Nemotron Nano 3 30B", + "display_name": "NVIDIA Nemotron Nano 3 30B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
2000000, - "output": 2000000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -122589,110 +129752,150 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.06, + "output": 0.24 }, "type": "chat" }, { - "id": "xai/grok-imagine-image", - "name": "Grok Imagine Image", - "display_name": "Grok Imagine Image", + "id": "anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-02-19", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + }, "type": "chat" }, { - "id": "xai/grok-4.20-multi-agent-beta", - "name": "Grok 4.20 Multi Agent Beta", - "display_name": "Grok 4.20 Multi Agent Beta", + "id": "google.gemma-3-4b-it", + "name": "Gemma 3 4B IT", + "display_name": "Gemma 3 4B IT", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, 
- "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.04, + "output": 0.08 }, "type": "chat" }, { - "id": "xai/grok-imagine-image-pro", - "name": "Grok Imagine Image Pro", - "display_name": "Grok Imagine Image Pro", + "id": "global.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (Global)", + "display_name": "Claude Opus 4.7 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-02-19", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "xai/grok-4-fast-reasoning", - "name": "Grok 4 Fast Reasoning", - "display_name": "Grok 4 Fast Reasoning", + "id": "minimax.minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -122702,8 +129905,8 @@ ] }, "limit": { - "context": 2000000, - "output": 256000 + "context": 196608, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -122711,27 +129914,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-non-reasoning", - "name": "Grok 4.1 Fast Non-Reasoning", - "display_name": "Grok 4.1 Fast Non-Reasoning", + "id": "openai.gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "display_name": "GPT OSS Safeguard 20B", "modalities": { "input": [ "text" @@ -122741,8 +129937,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -122751,33 +129947,29 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.07, + "output": 0.2 }, "type": 
"chat" }, { - "id": "xai/grok-4.20-reasoning-beta", - "name": "Grok 4.20 Beta Reasoning", - "display_name": "Grok 4.20 Beta Reasoning", + "id": "deepseek.v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 163840, + "output": 81920 }, "temperature": true, "tool_call": true, @@ -122785,155 +129977,243 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.62, + "output": 1.85 }, "type": "chat" }, { - "id": "xai/grok-4.20-multi-agent", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "global.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (Global)", + "display_name": "Claude Opus 4.6 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-reasoning", - "name": "Grok 4.1 Fast Reasoning", - "display_name": "Grok 4.1 Fast Reasoning", + "id": "anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xai/grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "global.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (Global)", + "display_name": "Claude Sonnet 4.6 (Global)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "us.meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct (US)", + "display_name": "Llama 4 Maverick 17B Instruct (US)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.24, + "output": 0.97 }, "type": "chat" }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "us.deepseek.r1-v1:0", + "name": "DeepSeek-R1 (US)", + "display_name": "DeepSeek-R1 (US)", "modalities": { "input": [ "text" @@ -122943,8 +130223,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -122954,66 +130234,69 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 
1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "xai/grok-2-vision", - "name": "Grok 2 Vision", - "display_name": "Grok 2 Vision", + "id": "au.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (AU)", + "display_name": "Claude Sonnet 4.5 (AU)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "us.anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1 (US)", + "display_name": "Claude Opus 4.1 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -123021,39 +130304,36 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "xai/grok-code-fast-1", - "name": "Grok Code Fast 
1", - "display_name": "Grok Code Fast 1", + "id": "anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -123061,171 +130341,288 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "xai/grok-3-fast", - "name": "Grok 3 Fast", - "display_name": "Grok 3 Fast", + "id": "us.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (US)", + "display_name": "Claude Sonnet 4.6 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.25 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xai/grok-3-mini-fast", - "name": "Grok 3 Mini Fast", - "display_name": "Grok 3 Mini Fast", + "id": "anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "NVIDIA Nemotron 3 Super 120B A12B", - "display_name": "NVIDIA Nemotron 3 Super 120B A12B", + "id": "eu.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (EU)", + "display_name": "Claude Sonnet 4.6 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-30", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.15, - "output": 0.65 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "Nemotron 3 Nano 30B A3B", - "display_name": "Nemotron 3 Nano 30B A3B", + "id": "eu.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (EU)", + "display_name": "Claude Opus 4.6 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12", - "last_updated": "2024-12", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.06, - "output": 0.24 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "nvidia/nemotron-nano-12b-v2-vl", - "name": "Nvidia Nemotron Nano 12B V2 VL", - "display_name": "Nvidia Nemotron Nano 12B V2 VL", + "id": "au.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (AU)", + "display_name": "Claude Haiku 4.5 (AU)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -123235,30 +130632,34 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12", - "last_updated": "2024-12", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.2, - "output": 0.6 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "nvidia/nemotron-nano-9b-v2", - "name": "Nvidia Nemotron Nano 9B V2", - "display_name": "Nvidia Nemotron Nano 9B V2", + "id": "jp.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (JP)", + "display_name": "Claude Sonnet 4.5 (JP)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -123266,97 +130667,160 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "knowledge": "2025-07-31", 
+ "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.04, - "output": 0.16 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "inception/mercury-edit-2", - "name": "Mercury Edit 2", - "display_name": "Mercury Edit 2", + "id": "jp.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (JP)", + "display_name": "Claude Sonnet 4.6 (JP)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "inception/mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": "us.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (US)", + "display_name": "Claude Opus 4.6 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-06", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.024999999999999998 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "inception/mercury-coder-small", - "name": "Mercury Coder Small Beta", - "display_name": "Mercury Coder Small Beta", + "id": "us.meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct (US)", + "display_name": "Llama 4 Scout 17B Instruct (US)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, + "context": 3500000, "output": 16384 }, "temperature": true, @@ -123364,20 +130828,21 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-02-26", - "last_updated": "2026-05-01", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.25, - "output": 1 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT 5.1 Codex Max", - "display_name": "GPT 5.1 Codex Max", + "id": "jp.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (JP)", + "display_name": "Claude Opus 4.7 (JP)", "modalities": { "input": [ "text", @@ -123389,10 +130854,10 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -123403,51 +130868,61 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "xhigh" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - 
"high" + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" - }, + } + ] + }, + "vercel": { + "id": "vercel", + "name": "Vercel AI Gateway", + "display_name": "Vercel AI Gateway", + "doc": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway", + "models": [ { - "id": "openai/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "prime-intellect/intellect-3", + "name": "INTELLECT 3", + "display_name": "INTELLECT 3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -123455,22 +130930,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.18 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "GPT 4o Mini Search Preview", - "display_name": "GPT 4o Mini Search Preview", + "id": 
"inception/mercury-edit-2", + "name": "Mercury Edit 2", + "display_name": "Mercury Edit 2", "modalities": { "input": [ "text" @@ -123481,41 +130955,71 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-30", + "last_updated": "2026-03-30", + "cost": { + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 + }, + "type": "chat" + }, + { + "id": "inception/mercury-coder-small", + "name": "Mercury Coder Small Beta", + "display_name": "Mercury Coder Small Beta", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2025-01", - "last_updated": "2025-01", + "release_date": "2025-02-26", + "last_updated": "2026-05-01", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "openai/codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "inception/mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -123523,22 +131027,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "release_date": "2026-02-24", + "last_updated": "2026-03-06", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.38 + "input": 0.25, + "output": 0.75, + "cache_read": 0.024999999999999998 }, "type": 
"chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "zai/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text", @@ -123546,13 +131049,12 @@ "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -123560,22 +131062,26 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-04-07", + "last_updated": "2026-04-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "openai/gpt-5.3-chat", - "name": "GPT-5.3 Chat", - "display_name": "GPT-5.3 Chat", + "id": "zai/glm-5v-turbo", + "name": "GLM 5V Turbo", + "display_name": "GLM 5V Turbo", "modalities": { "input": [ "text", @@ -123587,8 +131093,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -123598,19 +131104,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-06", + "release_date": "2026-04-01", + "last_updated": "2026-04-03", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT 5.2 ", - "display_name": "GPT 5.2 ", + "id": "zai/glm-4.6v-flash", + "name": "GLM-4.6V-Flash", + "display_name": "GLM-4.6V-Flash", "modalities": { "input": [ "text", @@ -123622,8 +131128,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 24000 }, "temperature": true, "tool_call": true, @@ 
-123631,41 +131137,17 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 21, - "output": 168 - }, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "type": "chat" }, { - "id": "openai/text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "zai/glm-4.7-flashx", + "name": "GLM 4.7 FlashX", + "display_name": "GLM 4.7 FlashX", "modalities": { "input": [ "text" @@ -123675,41 +131157,48 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 200000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.13, - "output": 0 + "input": 0.06, + "output": 0.4, + "cache_read": 0.01 }, - "type": "embedding" + "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT 5.5", - "display_name": "GPT 5.5", + "id": "zai/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 96000 }, "temperature": true, 
"tool_call": true, @@ -123717,55 +131206,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT 5.3 Codex", - "display_name": "GPT 5.3 Codex", + "id": "zai/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -123773,42 +131240,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "openai/text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": 
"text-embedding-ada-002", + "id": "zai/glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -123818,101 +131264,86 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 200000, + "output": 131000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "cost": { - "input": 0.1, - "output": 0 + "input": 0.07, + "output": 0.39999999999999997 }, - "type": "embedding" + "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "zai/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 96000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.18 + "input": 0.45, + "output": 1.8 }, "type": 
"chat" }, { - "id": "openai/o3-pro", - "name": "o3 Pro", - "display_name": "o3 Pro", + "id": "zai/glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -123921,159 +131352,118 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 20, - "output": 80 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "GPT 5.4 Mini", - "display_name": "GPT 5.4 Mini", + "id": "zai/glm-5-turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202800, + "output": 131100 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-17", + 
"release_date": "2026-03-15", "last_updated": "2026-03-17", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT 5.4 Nano", - "display_name": "GPT 5.4 Nano", + "id": "zai/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 120000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-10", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.19999999999999998, - "output": 1.25, - "cache_read": 0.02 + "input": 0.43, + "output": 1.75, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "zai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -124084,40 +131474,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": 
"effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12", - "last_updated": "2025-12", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-19", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "zai/glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", @@ -124129,164 +131508,94 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 24000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 0.3, + "output": 0.9, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "openai/gpt-5.1-thinking", - "name": "GPT 5.1 Thinking", - "display_name": "GPT 5.1 Thinking", + "id": "cohere/embed-v4.0", + "name": "Embed v4.0", + "display_name": 
"Embed v4.0", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 1536 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT 5.4 Pro", - "display_name": "GPT 5.4 Pro", + "id": "cohere/command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-06", + "knowledge": "2024-10", + "release_date": "2025-03-13", + 
"last_updated": "2025-03-13", "cost": { - "input": 30, - "output": 180 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5 Turbo", - "display_name": "GPT-3.5 Turbo", + "id": "voyage/voyage-4-lite", + "name": "voyage-4-lite", + "display_name": "voyage-4-lite", "modalities": { "input": [ "text" @@ -124296,8 +131605,8 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": false, @@ -124306,69 +131615,41 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2021-09", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", - "cost": { - "input": 0.5, - "output": 1.5 - }, + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "voyage/voyage-4", + "name": "voyage-4", + "display_name": "voyage-4", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", - "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 - }, + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "openai/text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + 
"id": "voyage/voyage-3.5", + "name": "voyage-3.5", + "display_name": "voyage-3.5", "modalities": { "input": [ "text" @@ -124388,75 +131669,49 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.02, + "input": 0.06, "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT 5.4", - "display_name": "GPT 5.4", + "id": "voyage/voyage-law-2", + "name": "voyage-law-2", + "display_name": "voyage-law-2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-06", + "release_date": "2024-03", + "last_updated": "2024-03", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "voyage/voyage-3.5-lite", + "name": "voyage-3.5-lite", + "display_name": "voyage-3.5-lite", "modalities": { "input": [ "text" @@ -124466,86 +131721,59 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + 
"tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.07, - "output": 0.3 + "input": 0.02, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5 pro", - "display_name": "GPT-5 pro", + "id": "voyage/voyage-3-large", + "name": "voyage-3-large", + "display_name": "voyage-3-large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 15, - "output": 120 + "input": 0.18, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "gpt-oss-safeguard-20b", - "display_name": "gpt-oss-safeguard-20b", + "id": "voyage/voyage-finance-2", + "name": "voyage-finance-2", + "display_name": "voyage-finance-2", "modalities": { "input": [ "text" @@ -124555,31 +131783,28 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 8192, + "output": 1536 }, - "temperature": 
true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2024-03", + "last_updated": "2024-03", "cost": { - "input": 0.08, - "output": 0.3, - "cache_read": 0.04 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "voyage/voyage-code-2", + "name": "voyage-code-2", + "display_name": "voyage-code-2", "modalities": { "input": [ "text" @@ -124589,69 +131814,55 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "GPT 5.5 Pro", - "display_name": "GPT 5.5 Pro", + "id": "voyage/voyage-4-large", + "name": "voyage-4-large", + "display_name": "voyage-4-large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": 
"2026-04-24", - "cost": { - "input": 30, - "output": 180 - }, + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "voyage/voyage-code-3", + "name": "voyage-code-3", + "display_name": "voyage-code-3", "modalities": { "input": [ "text" @@ -124662,319 +131873,246 @@ }, "limit": { "context": 8192, - "output": 4096 + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2021-09", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 1.5, - "output": 2 + "input": 0.18, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.1-instant", - "name": "GPT-5.1 Instant", - "display_name": "GPT-5.1 Instant", + "id": "bytedance/seed-1.6", + "name": "Seed 1.6", + "display_name": "Seed 1.6", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.25, + 
"output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "bytedance/seed-1.8", + "name": "Seed 1.8", + "display_name": "Seed 1.8", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-10", + "last_updated": "2025-10", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "bfl/flux-pro-1.0-fill", + "name": "FLUX.1 Fill [pro]", + "display_name": "FLUX.1 Fill [pro]", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 512, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 - }, + "release_date": "2024-10", + "last_updated": 
"2024-10", "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "bfl/flux-kontext-max", + "name": "FLUX.1 Kontext Max", + "display_name": "FLUX.1 Kontext Max", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 512, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, + "release_date": "2025-06", + "last_updated": "2025-06", "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "bfl/flux-pro-1.1", + "name": "FLUX1.1 [pro]", + "display_name": "FLUX1.1 [pro]", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 512, + "output": 8192 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, + "release_date": "2024-10", + "last_updated": "2024-10", "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - 
"display_name": "GPT-4o", + "id": "bfl/flux-pro-1.1-ultra", + "name": "FLUX1.1 [pro] Ultra", + "display_name": "FLUX1.1 [pro] Ultra", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 512, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "release_date": "2024-11", + "last_updated": "2024-11", + "type": "chat" + }, + { + "id": "bfl/flux-kontext-pro", + "name": "FLUX.1 Kontext Pro", + "display_name": "FLUX.1 Kontext Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 512, + "output": 8192 }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2025-06", "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -124983,81 +132121,106 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, 
"attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", + "cost": { + "input": 0.6, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "moonshotai/kimi-k2-turbo", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-08", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 2.4, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 
128000 + "context": 216144, + "output": 216144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -125066,40 +132229,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.47, + "output": 2, + "cache_read": 0.14 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "moonshotai/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -125109,10 +132262,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262114, + "output": 262114 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -125121,33 +132274,25 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true } }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 
1.15, + "output": 8, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -125159,10 +132304,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -125170,88 +132315,60 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "open_weights": true, + "release_date": "2026-04-20", + "last_updated": "2026-04-24", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "moonshotai/kimi-k2", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": 
true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "mistral/mistral-medium", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -125259,7 +132376,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -125268,109 +132385,110 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "mistral/devstral-2", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-10", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "type": "chat" + }, + { + "id": "mistral/codestral-embed", + "name": "Codestral Embed", + "display_name": "Codestral Embed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 1536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + 
"supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 10, - "output": 30 + "input": 0.15, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "mistral/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 60288, + "output": 16000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-04", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.04, + "output": 0.17 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "mistral/mistral-large-3", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ "text", @@ -125381,52 +132499,29 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-10", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "amazon/titan-embed-text-v2", - "name": "Titan Text Embeddings V2", - "display_name": "Titan Text Embeddings V2", + "id": "mistral/devstral-small-2", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", "modalities": { "input": [ "text" @@ -125436,132 +132531,122 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 256000, + "output": 256000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-04", - "last_updated": "2024-04", - "cost": { - "input": 0.02, - "output": 0 - }, + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "type": "chat" }, { - "id": "amazon/nova-2-lite", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "mistral/devstral-small", + "name": "Devstral Small 1.1", + "display_name": "Devstral Small 1.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-10", - 
"release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "amazon/nova-pro", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "mistral/ministral-14b", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "amazon/nova-lite", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": "mistral/mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "amazon/nova-micro", - "name": "Nova Micro", - "display_name": "Nova Micro", + "id": "mistral/magistral-medium", + "name": "Magistral Medium (latest)", + "display_name": 
"Magistral Medium (latest)", "modalities": { "input": [ "text" @@ -125572,29 +132657,29 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 + "input": 2, + "output": 5 }, "type": "chat" }, { - "id": "mistral/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "mistral/ministral-3b", + "name": "Ministral 3B (latest)", + "display_name": "Ministral 3B (latest)", "modalities": { "input": [ "text" @@ -125604,8 +132689,8 @@ ] }, "limit": { - "context": 60288, - "output": 16000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -125613,54 +132698,53 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { "input": 0.04, - "output": 0.17 + "output": 0.04 }, "type": "chat" }, { - "id": "mistral/ministral-14b", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "mistral/pixtral-large", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - 
"release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0.2, - "output": 0.2 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "mistral/codestral-embed", - "name": "Codestral Embed", - "display_name": "Codestral Embed", + "id": "mistral/ministral-8b", + "name": "Ministral 8B (latest)", + "display_name": "Ministral 8B (latest)", "modalities": { "input": [ "text" @@ -125670,39 +132754,39 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0.15, - "output": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "mistral/mistral-medium", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "mistral/mixtral-8x22b-instruct", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 64000, "output": 64000 }, "temperature": true, @@ -125710,21 +132794,21 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0.4, - "output": 2 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "mistral/mistral-embed", - "name": "Mistral Embed", - "display_name": "Mistral Embed", + 
"id": "mistral/magistral-small", + "name": "Magistral Small", + "display_name": "Magistral Small", "modalities": { "input": [ "text" @@ -125734,28 +132818,30 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "cost": { - "input": 0.1, - "output": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "mistral/devstral-2", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "mistral/codestral", + "name": "Codestral (latest)", + "display_name": "Codestral (latest)", "modalities": { "input": [ "text" @@ -125766,7 +132852,7 @@ }, "limit": { "context": 256000, - "output": 256000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -125774,16 +132860,20 @@ "supported": false }, "attachment": false, - "open_weights": false, + "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", + "cost": { + "input": 0.3, + "output": 0.9 + }, "type": "chat" }, { - "id": "mistral/mistral-large-3", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "mistral/pixtral-12b", + "name": "Pixtral 12B", + "display_name": "Pixtral 12B", "modalities": { "input": [ "text", @@ -125794,32 +132884,33 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-02", 
- "last_updated": "2025-12-02", + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "mistral/devstral-small-2", - "name": "Devstral Small 2", - "display_name": "Devstral Small 2", + "id": "mistral/mistral-small", + "name": "Mistral Small (latest)", + "display_name": "Mistral Small (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -125831,20 +132922,56 @@ }, "temperature": true, "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", + "cost": { + "input": 0.15, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "morph/morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 16000 + }, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "cost": { + "input": 0.8, + "output": 1.2 + }, "type": "chat" }, { - "id": "mistral/devstral-small", - "name": "Devstral Small 1.1", - "display_name": "Devstral Small 1.1", + "id": "morph/morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ "text" @@ -125854,29 +132981,28 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - 
"knowledge": "2024-10", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.9, + "output": 1.9 }, "type": "chat" }, { - "id": "mistral/ministral-8b", - "name": "Ministral 8B (latest)", - "display_name": "Ministral 8B (latest)", + "id": "openai/text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -125886,29 +133012,28 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.13, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "mistral/magistral-medium", - "name": "Magistral Medium (latest)", - "display_name": "Magistral Medium (latest)", + "id": "openai/gpt-4o-mini-search-preview", + "name": "GPT 4o Mini Search Preview", + "display_name": "GPT 4o Mini Search Preview", "modalities": { "input": [ "text" @@ -125922,60 +133047,83 @@ "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 2, - "output": 5 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "mistral/mistral-small", - "name": "Mistral Small (latest)", - 
"display_name": "Mistral Small (latest)", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.75, + "output": 14, + "cache_read": 0.18 }, "type": "chat" }, { - "id": "mistral/magistral-small", - "name": "Magistral Small", - "display_name": "Magistral Small", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo", + "display_name": "GPT-3.5 Turbo", "modalities": { "input": [ "text" @@ -125985,20 +133133,19 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "open_weights": false, + "knowledge": "2021-09", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { "input": 0.5, "output": 1.5 @@ -126006,42 +133153,115 @@ "type": "chat" }, { - "id": "mistral/pixtral-12b", - "name": "Pixtral 
12B", - "display_name": "Pixtral 12B", + "id": "openai/o3-pro", + "name": "o3 Pro", + "display_name": "o3 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 20, + "output": 80 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.4-nano", + "name": "GPT 5.4 Nano", + "display_name": "GPT 5.4 Nano", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "open_weights": false, + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.19999999999999998, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "mistral/mixtral-8x22b-instruct", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": 
"openai/text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -126051,126 +133271,179 @@ ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "open_weights": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 2, - "output": 6 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "mistral/pixtral-large", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "openai/gpt-5.5-pro", + "name": "GPT 5.5 Pro", + "display_name": "GPT 5.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 6 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "mistral/ministral-3b", - "name": "Ministral 3B (latest)", - "display_name": "Ministral 3B (latest)", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, 
"temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "mistral/codestral", - "name": "Codestral (latest)", - "display_name": "Codestral (latest)", + "id": "openai/gpt-5.2-pro", + "name": "GPT 5.2 ", + "display_name": "GPT 5.2 ", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 0.9 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "meta/llama-3.2-1b", - "name": "Llama 3.2 1B 
Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -126180,8 +133453,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -126190,19 +133463,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "knowledge": "2021-09", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "meta/llama-3.1-8b", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -126213,61 +133486,68 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.03, - "output": 0.05 + "input": 0.07, + "output": 0.3 }, "type": "chat" }, { - "id": "meta/llama-3.2-90b", - "name": "Llama 3.2 90B Vision Instruct", - "display_name": "Llama 3.2 90B Vision Instruct", + "id": "openai/gpt-oss-safeguard-20b", + "name": "gpt-oss-safeguard-20b", + "display_name": "gpt-oss-safeguard-20b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 
65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.08, + "output": 0.3, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "meta/llama-3.2-3b", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "openai/text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -126277,204 +133557,322 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "meta/llama-3.2-11b", - "name": "Llama 3.2 11B Vision Instruct", - "display_name": "Llama 3.2 11B Vision Instruct", + "id": "openai/gpt-5-pro", + "name": "GPT-5 pro", + "display_name": "GPT-5 pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 272000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + 
"verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.16, - "output": 0.16 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "meta/llama-3.1-70b", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "openai/gpt-5.4", + "name": "GPT 5.4", + "display_name": "GPT 5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1050000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-03-05", + "last_updated": "2026-03-06", "cost": { - "input": 0.4, - "output": 0.4 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "meta/llama-3.3-70b", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "openai/gpt-5.4-mini", + "name": "GPT 5.4 Mini", + "display_name": "GPT 5.4 Mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0, - "output": 0 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "meta/llama-4-maverick", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "openai/gpt-5.1-thinking", + "name": "GPT 5.1 Thinking", + "display_name": "GPT 5.1 Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 
0.13 }, "type": "chat" }, { - "id": "meta/llama-4-scout", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1 Instant", + "display_name": "GPT-5.1 Instant", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "vercel/v0-1.5-md", - "name": "v0-1.5-md", - "display_name": "v0-1.5-md", + "id": "openai/codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 200000, + "output": 100000 }, "temperature": true, "tool_call": true, @@ -126484,51 +133882,77 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "knowledge": "2024-10", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 3, - "output": 15 + "input": 1.5, + "output": 6, + "cache_read": 0.38 }, "type": "chat" }, { - "id": 
"vercel/v0-1.0-md", - "name": "v0-1.0-md", - "display_name": "v0-1.0-md", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT 5.1 Codex Max", + "display_name": "GPT 5.1 Codex Max", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 3, - "output": 15 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "Minimax M2.7", - "display_name": "Minimax M2.7", + "id": "openai/gpt-5.5", + "name": "GPT 5.5", + "display_name": "GPT 5.5", "modalities": { "input": [ "text", @@ -126540,8 +133964,8 @@ ] }, "limit": { - "context": 204800, - "output": 131000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -126552,42 +133976,52 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": 
"2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7-highspeed", - "name": "MiniMax M2.7 High Speed", - "display_name": "MiniMax M2.7 High Speed", + "id": "openai/gpt-5.4-pro", + "name": "GPT 5.4 Pro", + "display_name": "GPT 5.4 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 1050000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -126598,82 +134032,107 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "release_date": "2026-03-05", + "last_updated": "2026-03-06", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262114, - "output": 262114 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, 
"extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.27, - "output": 1.15, - "cache_read": 0.03, - "cache_write": 0.38 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -126684,37 +134143,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2025-12", + "last_updated": "2025-12", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.38 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1-lightning", - "name": "MiniMax M2.1 Lightning", - "display_name": "MiniMax 
M2.1 Lightning", + "id": "openai/gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -126722,34 +134198,35 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 2.4, - "cache_read": 0.03, - "cache_write": 0.38 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "openai/gpt-5.3-codex", + "name": "GPT 5.3 Codex", + "display_name": "GPT 5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -126759,25 +134236,76 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-19", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "MiniMax 
M2.5 High Speed", - "display_name": "MiniMax M2.5 High Speed", + "id": "openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.18 + }, + "type": "chat" + }, + { + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -126787,8 +134315,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -126802,61 +134330,83 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-03-13", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro-v1", - "name": "KAT-Coder-Pro V1", - "display_name": "KAT-Coder-Pro V1", + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": 
"effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-10-24", - "last_updated": "2025-10-24", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", + "cost": { + "input": 10, + "output": 40, + "cache_read": 2.5 + }, "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro-v2", - "name": "Kat Coder Pro V2", - "display_name": "Kat Coder Pro V2", + "id": "openai/gpt-5.3-chat", + "name": "GPT-5.3 Chat", + "display_name": "GPT-5.3 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -126864,78 +134414,77 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-30", + "release_date": "2026-03-03", + "last_updated": "2026-03-06", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - 
"unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -126947,10 +134496,10 @@ ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -126958,40 +134507,48 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-06", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "google/gemini-3-pro-image", - "name": "Nano Banana Pro (Gemini 3 Pro Image)", - "display_name": "Nano Banana Pro (Gemini 3 Pro Image)", + "id": "openai/o3-mini", + 
"name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -127000,49 +134557,46 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ "low", + "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-09", - "last_updated": "2025-09", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 2, - "output": 120 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -127052,51 +134606,53 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", + "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + 
"visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-02-24", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -127106,98 +134662,66 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ "low", + "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "google/imagen-4.0-ultra-generate-001", - "name": "Imagen 4 Ultra", - "display_name": "Imagen 4 Ultra", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" - ], - "output": [ + "text", "image" - ] - }, - "limit": { - "context": 480, - "output": 8192 
- }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-05-24", - "last_updated": "2025-05-24", - "type": "imageGeneration" - }, - { - "id": "google/gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", - "modalities": { - "input": [ - "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1047576, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.15, - "output": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, - "type": "embedding" + "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", @@ -127209,163 +134733,204 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-03", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.14, - "output": 0.39999999999999997 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, 
{ - "id": "google/gemini-2.5-flash-image", - "name": "Nano Banana (Gemini 2.5 Flash Image)", - "display_name": "Nano Banana (Gemini 2.5 Flash Image)", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" - ], - "output": [ "text", "image" + ], + "output": [ + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-03-20", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.3, - "output": 2.5 + "input": 10, + "output": 30 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/text-embedding-005", - "name": "Text Embedding 005", - "display_name": "Text Embedding 005", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-08", - "last_updated": "2024-08", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.03, - "output": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "google/text-multilingual-embedding-002", - "name": "Text Multilingual Embedding 002", - "display_name": "Text Multilingual Embedding 002", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { 
"input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-03", - "last_updated": "2024-03", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.03, - "output": 0 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-image-preview", - "name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", - "display_name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, + "context": 1047576, "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-03-06", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.5, - "output": 3 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": 
"google/gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", @@ -127377,50 +134942,44 @@ ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-05-07", - "last_updated": "2026-05-08", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.03 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "google/gemini-3-flash", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -127430,123 +134989,108 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ "minimal", "low", "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2024-09-30", + 
"release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "google/imagen-4.0-generate-001", - "name": "Imagen 4", - "display_name": "Imagen 4", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "type": "imageGeneration" + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09-25", - "display_name": "Gemini 2.5 Flash Preview 09-25", + "id": "amazon/nova-2-lite", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 1000000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - 
"release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "cache_write": 0.383 + "output": 2.5 }, "type": "chat" }, { - "id": "google/gemini-embedding-2", - "name": "Gemini Embedding 2", - "display_name": "Gemini Embedding 2", + "id": "amazon/titan-embed-text-v2", + "name": "Titan Text Embeddings V2", + "display_name": "Titan Text Embeddings V2", "modalities": { "input": [ "text" @@ -127557,225 +135101,195 @@ }, "limit": { "context": 8192, - "output": 8192 + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-10", - "last_updated": "2026-03-23", + "release_date": "2024-04", + "last_updated": "2024-04", + "cost": { + "input": 0.02, + "output": 0 + }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B IT", - "display_name": "Gemma 4 26B A4B IT", + "id": "amazon/nova-lite", + "name": "Nova Lite", + "display_name": "Nova Lite", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-03", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.13, - "output": 0.39999999999999997 + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "google/imagen-4.0-fast-generate-001", - "name": "Imagen 4 Fast", - "display_name": "Imagen 4 Fast", + "id": "amazon/nova-micro", + "name": "Nova Micro", + "display_name": "Nova Micro", 
"modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, + "context": 128000, "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2025-06", - "type": "imageGeneration" + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "cost": { + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "amazon/nova-pro", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01 + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-image-preview", - "name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", - "display_name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", + "id": 
"recraft/recraft-v2", + "name": "Recraft V2", + "display_name": "Recraft V2", "modalities": { "input": [ "text" ], "output": [ - "text", "image" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 512, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-03-20", - "cost": { - "input": 0.3, - "output": 2.5 - }, - "type": "imageGeneration" + "release_date": "2024-03", + "last_updated": "2024-03", + "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "recraft/recraft-v3", + "name": "Recraft V3", + "display_name": "Recraft V3", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1048576, + "context": 512, "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.075, - "output": 0.3 - }, + "release_date": "2024-10", + "last_updated": "2024-10", "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -127786,55 +135300,38 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": 
true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "interleaved": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { "input": 0.3, - "output": 2.5, + "output": 1.2, "cache_read": 0.03, - "input_audio": 1 + "cache_write": 0.38 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax M2.7 High Speed", + "display_name": "MiniMax M2.7 High Speed", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131100 }, "temperature": true, "tool_call": true, @@ -127845,80 +135342,106 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 + }, + "type": "chat" + }, + { + "id": "minimax/minimax-m2", + "name": 
"MiniMax M2", + "display_name": "MiniMax M2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262114, + "output": 262114 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true } }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.27, + "output": 1.15, + "cache_read": 0.03, + "cache_write": 0.38 + }, "type": "chat" }, { - "id": "google/gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "minimax/minimax-m2.1-lightning", + "name": "MiniMax M2.1 Lightning", + "display_name": "MiniMax M2.1 Lightning", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.3, + "output": 2.4, + "cache_read": 0.03, + "cache_write": 0.38 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-turbo", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -127928,42 +135451,49 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 204800, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2026-02-12", + "last_updated": "2026-02-19", "cost": { - "input": 2.4, - "output": 10 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "minimax/minimax-m2.7", + "name": "Minimax M2.7", + "display_name": "Minimax M2.7", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -127984,19 +135514,20 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 1.2 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax M2.5 High Speed", + "display_name": "MiniMax M2.5 High Speed", "modalities": { "input": [ "text" @@ -128006,8 +135537,8 @@ ] }, "limit": { - "context": 262114, - "output": 262114 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -128017,26 +135548,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2026-02-12", + 
"last_updated": "2026-03-13", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.6, + "output": 2.4, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "kwaipilot/kat-coder-pro-v2", + "name": "Kat Coder Pro V2", + "display_name": "Kat Coder Pro V2", "modalities": { "input": [ "text" @@ -128046,42 +135576,71 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2026-03-27", + "last_updated": "2026-03-30", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "kwaipilot/kat-coder-pro-v1", + "name": "KAT-Coder-Pro V1", + "display_name": "KAT-Coder-Pro V1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 32000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-10-24", + "last_updated": "2025-10-24", + "type": "chat" + }, + { + "id": "nvidia/nemotron-nano-12b-v2-vl", + "name": "Nvidia Nemotron Nano 12B V2 VL", + "display_name": "Nvidia Nemotron Nano 12B V2 VL", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -128089,26 +135648,21 
@@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-24", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "NVIDIA Nemotron 3 Super 120B A12B", + "display_name": "NVIDIA Nemotron 3 Super 120B A12B", "modalities": { "input": [ "text" @@ -128118,42 +135672,28 @@ ] }, "limit": { - "context": 216144, - "output": 216144 + "context": 256000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2026-03-18", + "last_updated": "2026-03-30", "cost": { - "input": 0.47, - "output": 2, - "cache_read": 0.14 + "input": 0.15, + "output": 0.65 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "nvidia/nemotron-nano-9b-v2", + "name": "Nvidia Nemotron Nano 9B V2", + "display_name": "Nvidia Nemotron Nano 9B V2", "modalities": { "input": [ "text" @@ -128164,28 +135704,29 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, 
"attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 1, - "output": 3 + "input": 0.04, + "output": 0.16 }, "type": "chat" }, - { - "id": "interfaze/interfaze-beta", - "name": "Interfaze Beta", - "display_name": "Interfaze Beta", + { + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "Nemotron 3 Nano 30B A3B", + "display_name": "Nemotron 3 Nano 30B A3B", "modalities": { "input": [ "text" @@ -128195,8 +135736,8 @@ ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": false, @@ -128206,18 +135747,19 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-10-07", - "last_updated": "2026-04-29", + "knowledge": "2024-10", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 1.5, - "output": 3.5 + "input": 0.06, + "output": 0.24 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-sonnet-20240620", - "name": "Claude 3.5 Sonnet (2024-06-20)", - "display_name": "Claude 3.5 Sonnet (2024-06-20)", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", @@ -128229,22 +135771,69 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends 
adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { "input": 3, - "output": 15 + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, @@ -128312,9 +135901,9 @@ "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -128326,48 +135915,31 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "interleaved": true } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, @@ -128415,9 +135987,9 @@ "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "anthropic/claude-3.5-sonnet-20240620", + "name": "Claude 3.5 Sonnet (2024-06-20)", + "display_name": "Claude 3.5 Sonnet (2024-06-20)", "modalities": { "input": [ "text", @@ -128430,37 +136002,28 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -128475,7 +136038,7 @@ "context": 1000000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -128485,51 +136048,42 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": 
"medium", + "mode": "effort", + "effort": "high", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh" ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "anthropic/claude-3-opus", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ "text", @@ -128542,7 +136096,7 @@ }, "limit": { "context": 200000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -128551,21 +136105,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5", - 
"display_name": "Claude Haiku 3.5", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", @@ -128578,7 +136132,44 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-3-opus", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -128587,14 +136178,14 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, @@ -128636,9 +136227,9 @@ "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -128651,30 +136242,31 @@ }, "limit": { "context": 200000, - "output": 4096 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + 
"knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", @@ -128687,19 +136279,18 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { "input": 3, "output": 15, @@ -128709,9 +136300,9 @@ "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -128734,9 +136325,9 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { "input": 3, "output": 15, @@ -128746,9 +136337,9 @@ "type": "chat" }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ "text", @@ -128761,7 +136352,7 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 4096 }, 
"temperature": true, "tool_call": true, @@ -128770,14 +136361,14 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, @@ -128839,9 +136430,9 @@ "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B IT", + "display_name": "Gemma 4 26B A4B IT", "modalities": { "input": [ "text", @@ -128853,8 +136444,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -128864,32 +136455,31 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2026-04-02", + "last_updated": "2026-04-03", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.13, + "output": 0.39999999999999997 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5-pro", - "name": "MiMo V2.5 Pro", - "display_name": "MiMo V2.5 Pro", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 131000 + "context": 1000000, + "output": 65000 }, "temperature": true, "tool_call": true, @@ -128897,35 +136487,41 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": 
"2026-05-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-08", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.19999999999999998 + "input": 0.25, + "output": 1.5, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5", - "name": "MiMo M2.5", - "display_name": "MiMo M2.5", + "id": "google/gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09-25", + "display_name": "Gemini 2.5 Flash Preview 09-25", "modalities": { "input": [ "text", "image", "audio", - "video" + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 131100 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -128933,32 +136529,110 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.39999999999999997, - "output": 2, - "cache_read": 0.08 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "cache_write": 0.383 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-pro", - "name": "MiMo V2 Pro", - "display_name": "MiMo V2 Pro", + "id": "google/imagen-4.0-fast-generate-001", + "name": "Imagen 4 Fast", + "display_name": "Imagen 4 Fast", "modalities": { "input": [ "text" ], "output": [ + "image" + ] + }, + "limit": { + "context": 480, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2025-06", + "type": 
"imageGeneration" + }, + { + "id": "google/imagen-4.0-generate-001", + "name": "Imagen 4", + "display_name": "Imagen 4", + "modalities": { + "input": [ "text" + ], + "output": [ + "image" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 480, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "type": "imageGeneration" + }, + { + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -128966,65 +136640,188 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-20", + "release_date": "2026-04-02", + "last_updated": "2026-04-03", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.19999999999999998 + "input": 0.14, + "output": 0.39999999999999997 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", + "id": "google/gemini-3.1-flash-image-preview", + "name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", + "display_name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", "modalities": { "input": [ - "text" + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-03-06", + "cost": { + "input": 0.5, + "output": 3 + }, + 
"type": "imageGeneration" + }, + { + "id": "google/gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { "input": 0.1, - "output": 0.29 + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "bytedance/seed-1.6", - "name": "Seed 1.6", - "display_name": "Seed 1.6", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + 
"open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.01 + }, + "type": "chat" + }, + { + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -129032,33 +136829,145 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + }, + "type": "chat" + }, + { + "id": "google/gemini-embedding-2", + "name": "Gemini Embedding 2", + "display_name": "Gemini Embedding 2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", + "release_date": "2026-03-10", + "last_updated": "2026-03-23", + "type": "chat" + }, + { + "id": "google/gemini-3-pro-image", + "name": "Nano Banana Pro (Gemini 3 Pro Image)", + "display_name": "Nano Banana Pro (Gemini 3 Pro Image)", + 
"modalities": { + "input": [ + "text" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 65536, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-03", "release_date": "2025-09", "last_updated": "2025-09", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 2, + "output": 120 }, "type": "chat" }, { - "id": "bytedance/seed-1.8", - "name": "Seed 1.8", - "display_name": "Seed 1.8", + "id": "google/gemini-3-flash", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -129067,50 +136976,258 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-10", - "last_updated": "2025-10", + "knowledge": "2025-03", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.25, - "output": 2, + "input": 0.5, + "output": 3, "cache_read": 0.05 }, "type": "chat" }, { - "id": "meituan/longcat-flash-chat", - "name": "LongCat Flash Chat", - "display_name": "LongCat Flash Chat", + "id": 
"google/gemini-2.5-flash-image-preview", + "name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", + "display_name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", "modalities": { "input": [ "text" ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", + "cost": { + "input": 0.3, + "output": 2.5 + }, + "type": "imageGeneration" + }, + { + "id": "google/gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1000000, + "output": 65000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-03", + "last_updated": "2026-03-06", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "cache_write": 1 + }, + "type": "chat" + }, + { + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + 
}, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-19", + "last_updated": "2026-02-24", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2 + }, + "type": "chat" + }, + { + "id": "google/imagen-4.0-ultra-generate-001", + "name": "Imagen 4 Ultra", + "display_name": "Imagen 4 Ultra", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 480, "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-24", + "last_updated": "2025-05-24", + "type": "imageGeneration" + }, + { + "id": "google/gemini-2.5-flash-image", + "name": "Nano Banana (Gemini 2.5 Flash Image)", + "display_name": "Nano Banana (Gemini 2.5 Flash Image)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", + "cost": { + "input": 0.3, + "output": 2.5 + }, + "type": "imageGeneration" + }, + { + "id": "google/gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 1536 + }, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-30", - "last_updated": "2025-08-30", - "type": "chat" + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "cost": { + "input": 0.15, + "output": 0 + }, + "type": "embedding" }, { - "id": "meituan/longcat-flash-thinking", - 
"name": "LongCat Flash Thinking", - "display_name": "LongCat Flash Thinking", + "id": "google/text-multilingual-embedding-002", + "name": "Text Multilingual Embedding 002", + "display_name": "Text Multilingual Embedding 002", "modalities": { "input": [ "text" @@ -129120,30 +137237,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2024-03", + "last_updated": "2024-03", "cost": { - "input": 0.15, - "output": 1.5 + "input": 0.03, + "output": 0 }, "type": "chat" }, { - "id": "meituan/longcat-flash-thinking-2601", - "name": "LongCat Flash Thinking 2601", - "display_name": "LongCat Flash Thinking 2601", + "id": "google/text-embedding-005", + "name": "Text Embedding 005", + "display_name": "Text Embedding 005", "modalities": { "input": [ "text" @@ -129153,180 +137268,278 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "release_date": "2024-08", + "last_updated": "2024-08", + "cost": { + "input": 0.03, + "output": 0 + }, "type": "chat" }, { - "id": "bfl/flux-pro-1.0-fill", - "name": "FLUX.1 Fill [pro]", - "display_name": "FLUX.1 Fill [pro]", + "id": "google/gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, + "context": 
1048576, "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-10", - "last_updated": "2024-10", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "bfl/flux-pro-1.1", - "name": "FLUX1.1 [pro]", - "display_name": "FLUX1.1 [pro]", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-10", - "last_updated": "2024-10", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 + }, "type": "chat" }, { - "id": "bfl/flux-kontext-pro", - "name": "FLUX.1 Kontext Pro", - "display_name": "FLUX.1 Kontext Pro", + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" 
], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, + "context": 1048576, "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2025-06", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.075, + "output": 0.3 + }, "type": "chat" }, { - "id": "bfl/flux-kontext-max", - "name": "FLUX.1 Kontext Max", - "display_name": "FLUX.1 Kontext Max", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2025-06", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } + }, "type": "chat" }, { - "id": "bfl/flux-pro-1.1-ultra", - "name": "FLUX1.1 
[pro] Ultra", - "display_name": "FLUX1.1 [pro] Ultra", + "id": "vercel/v0-1.0-md", + "name": "v0-1.0-md", + "display_name": "v0-1.0-md", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 128000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-11", - "last_updated": "2024-11", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15 + }, "type": "chat" - } - ] - }, - "minimax": { - "id": "minimax", - "name": "MiniMax (minimax.io)", - "display_name": "MiniMax (minimax.io)", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/guides/quickstart", - "models": [ + }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "vercel/v0-1.5-md", + "name": "v0-1.5-md", + "display_name": "v0-1.5-md", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -129334,25 +137547,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 0.3, - "output": 1.2 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": 
"DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -129362,8 +137570,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -129371,27 +137579,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.27, + "output": 0.4 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -129401,8 +137603,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -129423,20 +137625,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-04-23", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -129446,42 +137647,35 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 163842, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, 
"extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.27, + "output": 0.4, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "deepseek/deepseek-v3", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -129491,34 +137685,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 163840, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.77, + "output": 0.77 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "deepseek/deepseek-v3.2-thinking", + "name": "DeepSeek V3.2 Thinking", + "display_name": "DeepSeek V3.2 Thinking", "modalities": { "input": [ "text" @@ -129528,8 +137717,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -129539,78 +137728,70 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + 
"interleaved": true } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.28, + "output": 0.42, + "cache_read": 0.03 }, "type": "chat" - } - ] - }, - "llmgateway": { - "id": "llmgateway", - "name": "LLM Gateway", - "display_name": "LLM Gateway", - "api": "https://api.llmgateway.io/v1", - "doc": "https://llmgateway.io/docs", - "models": [ + }, { - "id": "gpt-4o-mini-search-preview", - "name": "GPT-4o Mini Search Preview", - "display_name": "GPT-4o Mini Search Preview", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 163840, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.3, + "output": 1 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast Reasoning", - "display_name": "Grok 4.1 Fast Reasoning", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -129620,24 +137801,30 @@ }, "extra_capabilities": { "reasoning": { - 
"supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-23", + "last_updated": "2026-04-24", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct (2507)", - "display_name": "Qwen3 235B A22B Instruct (2507)", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -129648,27 +137835,29 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "knowledge": "2025-07", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "llama-4-scout", - "name": "Llama 4 Scout", - "display_name": "Llama 4 Scout", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -129678,28 +137867,41 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - 
"open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.18, - "output": 0.59 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "perplexity/sonar-reasoning", + "name": "Sonar Reasoning", + "display_name": "Sonar Reasoning", "modalities": { "input": [ "text" @@ -129709,91 +137911,96 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 127000, + "output": 8000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.14, - "output": 0.14 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "qwen-coder-plus", - "name": "Qwen Coder Plus", - "display_name": "Qwen Coder Plus", + "id": "perplexity/sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 127000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.5, + "input": 1, "output": 1 }, "type": "chat" }, { - "id": "auto", - "name": "Auto Route", - "display_name": "Auto Route", + "id": "perplexity/sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": 
"Sonar Reasoning Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 127000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "glm-4.6v-flashx", - "name": "GLM-4.6V FlashX", - "display_name": "GLM-4.6V FlashX", + "id": "perplexity/sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ "text", @@ -129804,30 +138011,29 @@ ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 200000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.04, - "output": 0.4, - "cache_read": 0 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gemma-2-27b-it-together", - "name": "Gemma 2 27B IT", - "display_name": "Gemma 2 27B IT", + "id": "arcee-ai/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ "text" @@ -129837,8 +138043,8 @@ ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": false, @@ -129846,19 +138052,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-06-27", - "last_updated": "2024-06-27", + "open_weights": false, + 
"knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2025-12", "cost": { - "input": 0.08, - "output": 0.08 + "input": 0.05, + "output": 0.15 }, "type": "chat" }, { - "id": "codestral-2508", - "name": "Codestral", - "display_name": "Codestral", + "id": "arcee-ai/trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ "text" @@ -129868,28 +138075,29 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 262100, + "output": 80000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "release_date": "2026-04-01", + "last_updated": "2026-04-03", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.25, + "output": 0.8999999999999999 }, "type": "chat" }, { - "id": "gemma-3-1b-it", - "name": "Gemma 3 1B IT", - "display_name": "Gemma 3 1B IT", + "id": "arcee-ai/trinity-large-preview", + "name": "Trinity Large Preview", + "display_name": "Trinity Large Preview", "modalities": { "input": [ "text" @@ -129899,28 +138107,29 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "glm-4-32b-0414-128k", - "name": "GLM-4 32B (0414-128k)", - "display_name": "GLM-4 32B (0414-128k)", + "id": "alibaba/qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ 
"text" @@ -129930,40 +138139,54 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.1, - "output": 0.1 + "input": 1.2, + "output": 6, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "seed-1-6-flash-250715", - "name": "Seed 1.6 Flash (250715)", - "display_name": "Seed 1.6 Flash (250715)", + "id": "alibaba/qwen3.5-plus", + "name": "Qwen 3.5 Plus", + "display_name": "Qwen 3.5 Plus", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -129971,21 +138194,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "open_weights": false, + "release_date": "2026-02-16", + "last_updated": "2026-02-19", "cost": { - "input": 0.07, - "output": 0.3, - "cache_read": 0.01 + "input": 0.4, + "output": 2.4, + "cache_read": 0.04, + "cache_write": 0.5 }, "type": "chat" }, { - "id": "seed-1-6-250615", - "name": "Seed 1.6 (250615)", - "display_name": "Seed 1.6 (250615)", + "id": "alibaba/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B 
A22B Instruct", "modalities": { "input": [ "text", @@ -129996,42 +138231,41 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 131072, + "output": 129024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", + "open_weights": false, + "release_date": "2025-09-24", + "last_updated": "2026-05-01", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 0.39999999999999997, + "output": 1.5999999999999999 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "alibaba/qwen3.6-27b", + "name": "Qwen 3.6 27B", + "display_name": "Qwen 3.6 27B", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -130051,19 +138285,19 @@ } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": false, + "release_date": "2026-04-22", + "last_updated": "2026-05-01", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.6, + "output": 3.5999999999999996 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b-thinking", - "name": "Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen3 VL 30B A3B Thinking", + "id": "alibaba/qwen3-vl-thinking", + "name": "Qwen3 VL Thinking", + "display_name": "Qwen3 VL Thinking", "modalities": { "input": [ "text", @@ -130075,7 +138309,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 129024 }, "temperature": true, "tool_call": true, @@ -130096,82 +138330,84 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-10-02", - "last_updated": "2025-10-02", + 
"knowledge": "2025-09", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.7, + "output": 8.4 }, "type": "chat" }, { - "id": "qwen2-5-vl-32b-instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "alibaba/qwen-3-235b", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 40960, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-15", - "last_updated": "2025-03-15", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-vl-8b-instruct", - "name": "Qwen3 VL 8B Instruct", - "display_name": "Qwen3 VL 8B Instruct", + "id": "alibaba/qwen-3-32b", + "name": "Qwen 3.32B", + "display_name": "Qwen 3.32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 40960, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { "input": 0.1, - "output": 0.1 + "output": 0.3 }, "type": "chat" }, { - "id": "claude-3-7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "alibaba/qwen3-max-thinking", + "name": "Qwen 
3 Max Thinking", + "display_name": "Qwen 3 Max Thinking", "modalities": { "input": [ "text" @@ -130181,62 +138417,96 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01", + "last_updated": "2025-01", + "cost": { + "input": 1.2, + "output": 6, + "cache_read": 0.24 + }, + "type": "chat" + }, + { + "id": "alibaba/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "gemini-pro-latest", - "name": "Gemini Pro Latest", - "display_name": "Gemini Pro Latest", + "id": "alibaba/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ - 
"text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -130244,21 +138514,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-27", - "last_updated": "2026-02-27", + "release_date": "2025-07-22", + "last_updated": "2026-02-19", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0.5, + "output": 1.2 }, "type": "chat" }, { - "id": "claude-3-5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "alibaba/qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ "text" @@ -130268,33 +138537,31 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "alibaba/qwen3-embedding-8b", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -130302,91 +138569,106 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": 
"2025-01-25", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 1.6, - "output": 6.4 + "input": 0.05, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "glm-4.6v-flash", - "name": "GLM-4.6V Flash", - "display_name": "GLM-4.6V Flash", + "id": "alibaba/qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.38, + "output": 1.53 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct (2507)", - "display_name": "Qwen3 30B A3B Instruct (2507)", + "id": "alibaba/qwen3.6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-02", + "last_updated": "2026-04-03", "cost": { - 
"input": 0.1, - "output": 0.1 + "input": 0.5, + "output": 3, + "cache_read": 0.09999999999999999, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "minimax-text-01", - "name": "MiniMax Text 01", - "display_name": "MiniMax Text 01", + "id": "alibaba/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -130396,29 +138678,41 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "knowledge": "2025-09", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "cost": { - "input": 0.2, - "output": 1.1 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen3-32b-fp8", - "name": "Qwen3 32B FP8", - "display_name": "Qwen3 32B FP8", + "id": "alibaba/qwen-3-14b", + "name": "Qwen3-14B", + "display_name": "Qwen3-14B", "modalities": { "input": [ "text" @@ -130428,8 +138722,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 40960, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -130438,62 +138732,66 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.06, + "output": 0.24 }, "type": "chat" }, { - "id": "llama-4-scout-17b-instruct", - "name": "Llama 4 Scout 17B Instruct", - "display_name": "Llama 4 Scout 17B Instruct", + "id": 
"alibaba/qwen-3-30b", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 40960, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.17, - "output": 0.66 + "input": 0.08, + "output": 0.29 }, "type": "chat" }, { - "id": "qwen3-4b-fp8", - "name": "Qwen3 4B FP8", - "display_name": "Qwen3 4B FP8", + "id": "alibaba/qwen3.5-flash", + "name": "Qwen 3.5 Flash", + "display_name": "Qwen 3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -130501,20 +138799,33 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.03, - "output": 0.05 + "input": 0.1, + "output": 0.4, + "cache_read": 0.001, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "ministral-8b-2512", - "name": "Ministral 8B", - "display_name": "Ministral 8B", + "id": "alibaba/qwen3-vl-instruct", + "name": "Qwen3 VL Instruct", + "display_name": "Qwen3 VL Instruct", "modalities": { "input": [ "text", 
@@ -130525,104 +138836,93 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 131072, + "output": 129024 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.7, + "output": 2.8 }, "type": "chat" }, { - "id": "gemma-3-27b", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "alibaba/qwen3-embedding-4b", + "name": "Qwen3 Embedding 4B", + "display_name": "Qwen3 Embedding 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "attachment": false, + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen3-vl-flash", - "name": "Qwen3 VL Flash", - "display_name": "Qwen3 VL Flash", + "id": "alibaba/qwen3-coder-30b-a3b", + "name": "Qwen 3 Coder 30B A3B Instruct", + "display_name": "Qwen 3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 160000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + 
"supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-09", - "last_updated": "2025-10-09", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.07, + "output": 0.27 }, "type": "chat" }, { - "id": "llama-3.1-70b-instruct", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "alibaba/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -130632,40 +138932,42 @@ ] }, "limit": { - "context": 128000, - "output": 2048 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-04", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.09, + "output": 1.1 }, "type": "chat" }, { - "id": "seed-1-8-251228", - "name": "Seed 1.8 (251228)", - "display_name": "Seed 1.8 (251228)", + "id": "alibaba/qwen-3.6-max-preview", + "name": "Qwen 3.6 Max Preview", + "display_name": "Qwen 3.6 Max Preview", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 240000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -130675,30 +138977,33 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "release_date": "2026-04-20", + "last_updated": "2026-04-24", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 1.3, + "output": 7.8, + "cache_read": 0.26, + "cache_write": 1.625 }, "type": "chat" }, { - "id": 
"qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking (2507)", - "display_name": "Qwen3 235B A22B Thinking (2507)", + "id": "alibaba/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262114, + "output": 262114 }, "temperature": true, "tool_call": true, @@ -130717,32 +139022,66 @@ ] } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 0.3, + "output": 2.9 + }, + "type": "chat" + }, + { + "id": "alibaba/qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 1000000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, "attachment": false, "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.8, - "output": 2.4 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "seed-1-6-250915", - "name": "Seed 1.6 (250915)", - "display_name": "Seed 1.6 (250915)", + "id": "xai/grok-4.20-reasoning", + "name": "Grok 4.20 Reasoning", + "display_name": "Grok 4.20 Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -130751,20 +139090,20 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": false, + "release_date": "2026-03-09", + 
"last_updated": "2026-03-23", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "glm-4.5-x", - "name": "GLM-4.5 X", - "display_name": "GLM-4.5 X", + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ "text" @@ -130774,8 +139113,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -130785,66 +139124,57 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 2.2, - "output": 8.9, - "cache_read": 0.45 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking (2507)", - "display_name": "Qwen3 30B A3B Thinking (2507)", + "id": "xai/grok-4.20-non-reasoning", + "name": "Grok 4.20 Non-Reasoning", + "display_name": "Grok 4.20 Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-09", + "last_updated": "2026-03-23", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2, + "output": 6, + "cache_read": 
0.19999999999999998 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast Reasoning", - "display_name": "Grok 4 Fast Reasoning", + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok 4.1 Fast Non-Reasoning", + "display_name": "Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -130857,16 +139187,11 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, + "knowledge": "2024-10", "release_date": "2025-07-09", "last_updated": "2025-07-09", "cost": { @@ -130877,21 +139202,20 @@ "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "xai/grok-4.20-multi-agent", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -130899,190 +139223,186 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "attachment": false, + "open_weights": false, + "release_date": "2026-03-09", + "last_updated": "2026-03-23", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.11 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "ministral-3b-2512", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "xai/grok-4.20-non-reasoning-beta", + "name": "Grok 4.20 Beta Non-Reasoning", + "display_name": "Grok 4.20 Beta Non-Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 
131072, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "open_weights": false, + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "xai/grok-imagine-image", + "name": "Grok Imagine Image", + "display_name": "Grok Imagine Image", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", - "cost": { - "input": 0.3, - "output": 0.9 - }, + "release_date": "2026-01-28", + "last_updated": "2026-02-19", "type": "chat" }, { - "id": "llama-3.1-nemotron-ultra-253b", - "name": "Llama 3.1 Nemotron Ultra 253B", - "display_name": "Llama 3.1 Nemotron Ultra 253B", + "id": "xai/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 1000000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - 
"attachment": false, - "open_weights": true, - "release_date": "2025-04-07", - "last_updated": "2025-04-07", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-30", + "last_updated": "2026-05-01", "cost": { - "input": 0.6, - "output": 1.8 + "input": 1.25, + "output": 2.5, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-instruct", - "name": "Llama 4 Maverick 17B Instruct", - "display_name": "Llama 4 Maverick 17B Instruct", + "id": "xai/grok-4.20-reasoning-beta", + "name": "Grok 4.20 Beta Reasoning", + "display_name": "Grok 4.20 Beta Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { - "input": 0.24, - "output": 0.97 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "grok-4-0709", - "name": "Grok 4 (0709)", - "display_name": "Grok 4 (0709)", + "id": "xai/grok-imagine-image-pro", + "name": "Grok Imagine Image Pro", + "display_name": "Grok Imagine Image Pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", - "cost": { - "input": 3, - "output": 15 - }, + "release_date": 
"2026-01-28", + "last_updated": "2026-02-19", "type": "chat" }, { - "id": "qwen3-30b-a3b-fp8", - "name": "Qwen3 30B A3B FP8", - "display_name": "Qwen3 30B A3B FP8", + "id": "xai/grok-4.20-multi-agent-beta", + "name": "Grok 4.20 Multi Agent Beta", + "display_name": "Grok 4.20 Multi Agent Beta", "modalities": { "input": [ "text" @@ -131092,8 +139412,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -131102,19 +139422,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": false, + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "minimax-m2.1-lightning", - "name": "MiniMax M2.1 Lightning", - "display_name": "MiniMax M2.1 Lightning", + "id": "xai/grok-4-fast-reasoning", + "name": "Grok 4 Fast Reasoning", + "display_name": "Grok 4 Fast Reasoning", "modalities": { "input": [ "text" @@ -131124,29 +139445,36 @@ ] }, "limit": { - "context": 196608, - "output": 131072 + "context": 2000000, + "output": 256000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.12, - "output": 0.48 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max (2026-01-23)", - "display_name": "Qwen3 Max (2026-01-23)", + "id": "xai/grok-2-vision", + "name": "Grok 2 Vision", + "display_name": "Grok 2 Vision", 
"modalities": { "input": [ "text", @@ -131157,41 +139485,30 @@ ] }, "limit": { - "context": 256000, - "output": 32800 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.6 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "interfaze/interfaze-beta", + "name": "Interfaze Beta", + "display_name": "Interfaze Beta", "modalities": { "input": [ "text" @@ -131201,28 +139518,29 @@ ] }, "limit": { - "context": 32768, + "context": 1000000, "output": 32000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "open_weights": false, + "release_date": "2025-10-07", + "last_updated": "2026-04-29", "cost": { - "input": 0.03, - "output": 0.05 + "input": 1.5, + "output": 3.5 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "meituan/longcat-flash-chat", + "name": "LongCat Flash Chat", + "display_name": "LongCat Flash Chat", "modalities": { "input": [ "text" @@ -131232,33 +139550,28 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - 
"default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "cost": { - "input": 0.8, - "output": 4 - }, + "knowledge": "2024-10", + "release_date": "2025-08-30", + "last_updated": "2025-08-30", "type": "chat" }, { - "id": "gpt-4o-search-preview", - "name": "GPT-4o Search Preview", - "display_name": "GPT-4o Search Preview", + "id": "meituan/longcat-flash-thinking", + "name": "LongCat Flash Thinking", + "display_name": "LongCat Flash Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -131266,63 +139579,60 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "knowledge": "2024-10", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 2.5, - "output": 10 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "custom", - "name": "Custom Model", - "display_name": "Custom Model", + "id": "meituan/longcat-flash-thinking-2601", + "name": "LongCat Flash Thinking 2601", + "display_name": "LongCat Flash Thinking 2601", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "type": "chat" }, { - "id": 
"qwen3-vl-30b-a3b-instruct", - "name": "Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen3 VL 30B A3B Instruct", + "id": "meta/llama-3.1-70b", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -131330,98 +139640,93 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-02", - "last_updated": "2025-10-02", + "attachment": false, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "meta/llama-3.1-8b", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163840, + "context": 131072, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.03 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-fp8", - "name": "Qwen3 235B A22B FP8", - "display_name": "Qwen3 235B A22B FP8", + "id": "meta/llama-3.2-90b", + "name": "Llama 3.2 90B Vision Instruct", + "display_name": "Llama 3.2 90B Vision Instruct", "modalities": { "input": [ - "text" 
+ "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.5, - "output": 2.5 + "input": 0.72, + "output": 0.72 }, "type": "chat" - }, - { - "id": "gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + }, + { + "id": "meta/llama-3.2-3b", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -131431,34 +139736,29 @@ ] }, "limit": { - "context": 131072, - "output": 32766 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "meta/llama-3.2-1b", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -131468,60 +139768,62 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + 
"open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.5 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "llama-3-8b-instruct", - "name": "Llama 3 8B Instruct", - "display_name": "Llama 3 8B Instruct", + "id": "meta/llama-3.2-11b", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.16, + "output": 0.16 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "meta/llama-4-maverick", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ "text", @@ -131532,8 +139834,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -131542,55 +139844,52 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "meta/llama-4-scout", + "name": 
"Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32766 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.15, - "output": 0.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen25-coder-7b", - "name": "Qwen2.5 Coder 7B", - "display_name": "Qwen2.5 Coder 7B", + "id": "meta/llama-3.3-70b", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -131600,28 +139899,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.05, - "output": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "xiaomi/mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ "text" @@ -131631,28 +139931,30 @@ ] }, "limit": { - "context": 128000, - "output": 2048 + "context": 1050000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { 
- "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-22", + "last_updated": "2026-05-01", "cost": { - "input": 0.22, - "output": 0.22 + "input": 1, + "output": 3, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "llama-3-70b-instruct", - "name": "Llama 3 70B Instruct", - "display_name": "Llama 3 70B Instruct", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ "text" @@ -131662,28 +139964,30 @@ ] }, "limit": { - "context": 8192, - "output": 8000 + "context": 262144, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.51, - "output": 0.74 + "input": 0.1, + "output": 0.29 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 (0528)", - "display_name": "DeepSeek R1 (0528)", + "id": "xiaomi/mimo-v2-pro", + "name": "MiMo V2 Pro", + "display_name": "MiMo V2 Pro", "modalities": { "input": [ "text" @@ -131693,72 +139997,75 @@ ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-05-28", - "last_updated": 
"2025-05-28", + "open_weights": false, + "release_date": "2026-03-18", + "last_updated": "2026-03-20", "cost": { - "input": 0.8, - "output": 2.4 + "input": 1, + "output": 3, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "glm-4.5-airx", - "name": "GLM-4.5 AirX", - "display_name": "GLM-4.5 AirX", + "id": "xiaomi/mimo-v2.5", + "name": "MiMo M2.5", + "display_name": "MiMo M2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1050000, + "output": 131100 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-04-22", + "last_updated": "2026-05-01", "cost": { - "input": 1.1, - "output": 4.5, - "cache_read": 0.22 + "input": 0.39999999999999997, + "output": 2, + "cache_read": 0.08 }, "type": "chat" - }, + } + ] + }, + "abliteration-ai": { + "id": "abliteration-ai", + "name": "abliteration.ai", + "display_name": "abliteration.ai", + "api": "https://api.abliteration.ai/v1", + "doc": "https://docs.abliteration.ai/models", + "models": [ { - "id": "ministral-14b-2512", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "abliterated-model", + "name": "Abliterated Model", + "display_name": "Abliterated Model", "modalities": { "input": [ "text", @@ -131769,28 +140076,37 @@ ] }, "limit": { - "context": 262144, + "context": 150000, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2026-01-06", + "last_updated": "2026-01-06", "cost": { - "input": 0.2, - "output": 0.2 + "input": 3, + "output": 3 }, "type": "chat" - }, + 
} + ] + }, + "deepseek": { + "id": "deepseek", + "name": "DeepSeek", + "display_name": "DeepSeek", + "api": "https://api.deepseek.com", + "doc": "https://api-docs.deepseek.com/zh-cn/quick_start/pricing", + "models": [ { - "id": "llama-3.2-11b-instruct", - "name": "Llama 3.2 11B Instruct", - "display_name": "Llama 3.2 11B Instruct", + "id": "deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ "text" @@ -131800,61 +140116,84 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 393216 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-09", + "release_date": "2024-12-26", + "last_updated": "2026-04-24", "cost": { - "input": 0.07, - "output": 0.33 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "claude-3-opus", - "name": "Claude 3 Opus", - "display_name": "Claude 3 Opus", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." 
+ ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "minimax-m2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -131864,10 +140203,10 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 393216 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -131876,68 +140215,101 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Compatibility alias for deepseek-v4-flash thinking mode." 
] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-09", + "release_date": "2025-01-20", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "grok-4-20-beta-0309-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." 
+ ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "perplexity": { + "id": "perplexity", + "name": "Perplexity", + "display_name": "Perplexity", + "doc": "https://docs.perplexity.ai", + "models": [ { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ "text" @@ -131947,184 +140319,155 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { "input": 1, - "output": 5 + "output": 1 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "display_name": "Perplexity Sonar Deep Research", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } 
- }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-01", + "release_date": "2025-02-01", + "last_updated": "2025-09-01", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 2, + "output": 8, + "reasoning": 3 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - 
"max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 3, + "output": 15 }, "type": "chat" - }, + } + ] + }, + "iflowcn": { + "id": "iflowcn", + "name": "iFlow", + "display_name": "iFlow", + "api": "https://apis.iflow.cn/v1", + "doc": "https://platform.iflow.cn/en/docs", + "models": [ { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "qwen3-max-preview", + "name": "Qwen3-Max-Preview", + "display_name": "Qwen3-Max-Preview", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -132138,21 +140481,20 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "kimi-k2-0905", + "name": "Kimi-K2-0905", + "display_name": "Kimi-K2-0905", "modalities": { "input": [ "text" @@ -132162,19 +140504,19 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 64000 }, 
"temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { "input": 0, "output": 0 @@ -132182,9 +140524,9 @@ "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "qwen3-vl-plus", + "name": "Qwen3-VL-Plus", + "display_name": "Qwen3-VL-Plus", "modalities": { "input": [ "text", @@ -132195,29 +140537,40 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen3-235b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ "text" @@ -132227,8 +140580,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -132236,34 +140589,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" 
- ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimax-m2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -132273,8 +140613,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -132295,20 +140635,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2-Exp", + "display_name": "DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -132318,47 +140657,34 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - 
"input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemma-3n-e4b-it", - "name": "Gemma 3n 4B", - "display_name": "Gemma 3n 4B", + "id": "deepseek-v3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ "text" @@ -132368,19 +140694,19 @@ ] }, "limit": { - "context": 8192, - "output": 2000 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { "input": 0, "output": 0 @@ -132388,59 +140714,65 @@ "type": "chat" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "qwen3-max", + "name": "Qwen3-Max", + "display_name": "Qwen3-Max", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.2-pro", - "name": "GPT-5.2 Pro", - 
"display_name": "GPT-5.2 Pro", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 200000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -132448,39 +140780,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2025-11-13", "cost": { - "input": 21, - "output": 168 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -132490,14 +140807,13 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -132511,35 +140827,31 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 
3.1 Flash Lite Preview", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3-235B-A22B-Thinking", + "display_name": "Qwen3-235B-A22B-Thinking", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -132549,38 +140861,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "kimi-k2", + "name": "Kimi-K2", + "display_name": "Kimi-K2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -132589,19 +140904,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.21, - "output": 0.63 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen3-coder-plus", + "name": "Qwen3-Coder-Plus", + "display_name": "Qwen3-Coder-Plus", "modalities": { "input": [ "text" @@ -132611,42 +140926,29 @@ ] }, "limit": { - 
"context": 204800, - "output": 131072 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "qwen3-235b-a22b-instruct", + "name": "Qwen3-235B-A22B-Instruct", + "display_name": "Qwen3-235B-A22B-Instruct", "modalities": { "input": [ "text" @@ -132656,8 +140958,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -132666,19 +140968,28 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.4, - "output": 2 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "stackit": { + "id": "stackit", + "name": "STACKIT", + "display_name": "STACKIT", + "api": "https://api.openai-compat.model-serving.eu01.onstackit.cloud/v1", + "doc": "https://docs.stackit.cloud/products/data-and-ai/ai-model-serving/basics/available-shared-models", + "models": [ { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", "modalities": { "input": [ "text" @@ -132688,105 
+140999,59 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 0.16, + "output": 0.27 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "neuralmagic/Mistral-Nemo-Instruct-2407-FP8", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "cortecs/Llama-3.3-70B-Instruct-FP8-Dynamic", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -132796,47 +141061,39 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -132846,77 +141103,55 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + 
"supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "qwen35-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 37000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "release_date": "2025-05-17", + "last_updated": "2025-05-17", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "intfloat/e5-mistral-7b-instruct", + "name": "E5 Mistral 7B", + "display_name": "E5 Mistral 7B", "modalities": { "input": [ "text" @@ -132926,29 +141161,28 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 4096, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "open_weights": true, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 1.6, - "output": 6.4 + "input": 
0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat (latest)", - "display_name": "GPT-5.3 Chat (latest)", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", + "name": "Qwen3-VL 235B", + "display_name": "Qwen3-VL 235B", "modalities": { "input": [ "text", @@ -132959,8 +141193,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 218000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -132968,75 +141202,74 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "open_weights": true, + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.64, + "output": 1.91 }, "type": "chat" }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "Qwen/Qwen3-VL-Embedding-8B", + "name": "Qwen3-VL Embedding 8B", + "display_name": "Qwen3-VL Embedding 8B", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 32000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": true, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.09, + "output": 0.09 }, "type": "chat" - }, + } + ] + }, + "evroc": { + "id": "evroc", + "name": "evroc", + "display_name": "evroc", + "api": "https://models.think.evroc.com/v1", + "doc": "https://docs.evroc.com/products/think/overview.html", + "models": [ { - "id": "gemini-3-flash-preview", - 
"name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -133045,103 +141278,71 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "input": 1.47, + "output": 5.9 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "openai/whisper-large-v3", + "name": "Whisper 3 Large", + "display_name": "Whisper 3 Large", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 448, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - 
"release_date": "2024-01-25", - "last_updated": "2025-09-11", + "open_weights": true, + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.4, - "output": 1.2, - "reasoning": 4 + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 65536, + "output": 65536 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -133149,51 +141350,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.24, + "output": 0.94 }, "type": "chat" }, { - "id": "qwen3.6-35b-a3b", - "name": "Qwen3.6 35B-A3B", - "display_name": "Qwen3.6 35B-A3B", + "id": "KBLab/kb-whisper-large", + "name": "KB Whisper", + "display_name": "KB Whisper", "modalities": { "input": [ - "text", - "image", - "video", "audio" ], "output": [ @@ -133201,195 +141376,150 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 448, + "output": 448 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - 
"supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-10-01", + "last_updated": "2024-10-01", + "cost": { + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, - "attachment": true, + "type": "chat" + }, + { + "id": "nvidia/Llama-3.3-70B-Instruct-FP8", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.248, - "output": 1.485 + "input": 1.18, + "output": 1.18 }, "type": "chat" }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "mistralai/Voxtral-Small-24B-2507", + "name": "Voxtral Small 24B", + "display_name": "Voxtral Small 24B", "modalities": { "input": [ - "text", - "image", "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "open_weights": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.07, - "output": 0.27, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, "type": "chat" }, { - "id": 
"claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "mistralai/devstral-small-2-24b-instruct-2512", + "name": "Devstral Small 2 24B Instruct 2512", + "display_name": "Devstral Small 2 24B Instruct 2512", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 32768, + "output": 32768 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.12, + "output": 0.47 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "mistralai/Magistral-Small-2509", + "name": "Magistral Small 1.2 24B", + "display_name": "Magistral Small 1.2 24B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.59, + "output": 2.36 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "microsoft/Phi-4-multimodal-instruct", + "name": "Phi-4 15B", + "display_name": "Phi-4 15B", "modalities": { "input": [ "text", @@ -133400,158 +141530,89 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 32000 }, - "temperature": 
false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.24, + "output": 0.47 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "intfloat/multilingual-e5-large-instruct", + "name": "E5 Multi-Lingual Large Embeddings 0.6B", + "display_name": "E5 Multi-Lingual Large Embeddings 0.6B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 512, + "output": 512 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.12, + "output": 0.12 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - 
"name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen3 VL 30B", + "display_name": "Qwen3 VL 30B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 100000, + "output": 100000 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.24, + "output": 0.94 }, "type": "chat" }, { - "id": "minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", + "name": "Qwen3 30B 2507", + "display_name": "Qwen3 30B 2507", "modalities": { "input": [ "text" @@ -133561,38 +141622,71 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 64000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.35, + "output": 1.42 }, "type": "chat" }, { - "id": 
"claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40960, + "output": 40960 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0.12, + "output": 0.12 + }, + "type": "embedding" + } + ] + }, + "nova": { + "id": "nova", + "name": "Nova", + "display_name": "Nova", + "api": "https://api.nova.amazon.com/v1", + "doc": "https://nova.amazon.com/dev/documentation", + "models": [ + { + "id": "nova-2-pro-v1", + "name": "Nova 2 Pro", + "display_name": "Nova 2 Pro", "modalities": { "input": [ "text", "image", + "video", "pdf" ], "output": [ @@ -133600,7 +141694,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -133611,24 +141705,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-12-03", + "last_updated": "2026-01-03", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "reasoning": 0 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "nova-2-lite-v1", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "pdf" ], "output": [ "text" @@ -133636,7 +141731,7 @@ }, "limit": { "context": 1000000, - "output": 32768 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -133644,147 +141739,111 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.05, - "output": 0.4 + "input": 0, + "output": 0, + "reasoning": 0 }, "type": "chat" - }, + } + ] + }, + "venice": { + "id": "venice", + "name": "Venice AI", + "display_name": "Venice AI", + "doc": "https://docs.venice.ai", + "models": [ { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "z-ai-glm-5-turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-15", + "last_updated": "2026-04-12", "cost": { - "input": 10, - "output": 30 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "hermes-3-llama-3.1-405b", + "name": "Hermes 3 Llama 3.1 405b", + "display_name": "Hermes 3 Llama 3.1 405b", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": 
true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "context": 128000, + "output": 16384 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-25", + "last_updated": "2026-03-12", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 1.1, + "output": 3 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3 VL 235B", + "display_name": "Qwen3 VL 235B", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -133799,25 +141858,18 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-01-16", + "last_updated": "2026-03-12", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 0.25, + "output": 1.5 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "google-gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + 
"display_name": "Google Gemma 3 27B Instruct", "modalities": { "input": [ "text", @@ -133828,8 +141880,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 198000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -133837,21 +141889,20 @@ "supported": false }, "attachment": true, - "open_weights": false, + "open_weights": true, "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "release_date": "2025-11-04", + "last_updated": "2026-03-12", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.12, + "output": 0.2 }, "type": "chat" }, { - "id": "sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", @@ -133862,131 +141913,145 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1000000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "release_date": "2026-04-18", + "last_updated": "2026-05-04", "cost": { - "input": 3, - "output": 15 + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, + "tiers": [ + { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 + } }, "type": "chat" }, { - "id": "pixtral-large-latest", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1000000, + 
"output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "release_date": "2026-04-24", + "last_updated": "2026-04-29", "cost": { - "input": 2, - "output": 6 + "input": 1.73, + "output": 3.796, + "cache_read": 0.33 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "zai-org-glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 198000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-03-12", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "grok-4-20-beta-0309-reasoning", - "name": 
"Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 160000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -133994,74 +142059,71 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", - "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 + "extra_capabilities": { + "reasoning": { + "supported": true } }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2025-12-04", + "last_updated": "2026-03-24", + "cost": { + "input": 0.33, + "output": 0.48, + "cache_read": 0.16 + }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "mistral-small-2603", + "name": "Mistral Small 4", + "display_name": "Mistral Small 4", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": true, + "release_date": "2026-03-16", + "last_updated": "2026-04-09", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.1875, + "output": 0.75 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "zai-org-glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", 
"modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -134069,34 +142131,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-03-12", "cost": { - "input": 0.276, - "output": 1.651, - "cache_read": 0.028, - "cache_write": 0.344 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -134107,53 +142155,36 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 198000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2025-01-15", + "last_updated": "2026-04-12", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 3.75, + "output": 18.75, + "cache_read": 
0.375, + "cache_write": 4.69 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "arcee-trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ "text" @@ -134163,13 +142194,14 @@ ] }, "limit": { - "context": 262144, + "context": 256000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -134183,68 +142215,64 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-04", "cost": { - "input": 1.2, - "output": 6 + "input": 0.3125, + "output": 1.125, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "minimax-m2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "venice-uncensored-1-2", + "name": "Venice Uncensored 1.2", + "display_name": "Venice Uncensored 1.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2026-04-01", + "last_updated": "2026-04-19", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.2, + "output": 0.9 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "grok-41-fast", + "name": "Grok 4.1 Fast", + "display_name": "Grok 4.1 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ 
"text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -134252,82 +142280,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "knowledge": "2025-07", + "release_date": "2025-12-01", + "last_updated": "2026-04-09", "cost": { - "input": 6, - "output": 24, - "cache_read": 1.3, - "cache_write": 0 + "input": 0.23, + "output": 0.57, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "minimax-m27", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 198000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2026-03-18", + "last_updated": "2026-04-12", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.375, + "output": 1.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "openai-gpt-55", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { 
"input": [ "text", @@ -134338,53 +142339,46 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-04-23", + "last_updated": "2026-04-25", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 6.25, + "output": 37.5, + "cache_read": 0.625, + "tiers": [ + { + "input": 12.5, + "output": 56.25, + "cache_read": 1.25, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 12.5, + "output": 56.25, + "cache_read": 1.25 + } }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "nvidia-nemotron-cascade-2-30b-a3b", + "name": "Nemotron Cascade 2 30B A3B", + "display_name": "Nemotron Cascade 2 30B A3B", "modalities": { "input": [ "text" @@ -134394,8 +142388,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -134405,58 +142399,52 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-03-24", + "last_updated": "2026-04-09", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.14, + "output": 0.8 }, "type": "chat" }, { - "id": "mistral-large-latest", - "name": 
"Mistral Large (latest)", - "display_name": "Mistral Large (latest)", + "id": "mistral-small-3-2-24b-instruct", + "name": "Mistral Small 3.2 24B Instruct", + "display_name": "Mistral Small 3.2 24B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "release_date": "2026-01-15", + "last_updated": "2026-03-16", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.09375, + "output": 0.25 }, "type": "chat" }, { - "id": "mistral-small-2506", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "nvidia-nemotron-3-nano-30b-a3b", + "name": "NVIDIA Nemotron 3 Nano 30B", + "display_name": "NVIDIA Nemotron 3 Nano 30B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -134473,19 +142461,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "release_date": "2026-01-27", + "last_updated": "2026-03-12", "cost": { - "input": 0.1, + "input": 0.075, "output": 0.3 }, "type": "chat" }, { - "id": "gemma-3-12b-it", - "name": "Gemma 3 12B", - "display_name": "Gemma 3 12B", + "id": "openai-gpt-4o-mini-2024-07-18", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ "text", @@ -134496,44 +142483,42 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "open_weights": 
false, + "release_date": "2026-02-28", + "last_updated": "2026-03-06", "cost": { - "input": 0, - "output": 0 + "input": 0.1875, + "output": 0.75, + "cache_read": 0.09375 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "zai-org-glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 198000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -134542,54 +142527,71 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-01", + "last_updated": "2026-04-04", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.85, + "output": 2.75, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "llama-3.2-3b", + "name": "Llama 3.2 3B", + "display_name": "Llama 3.2 3B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + 
"knowledge": "2023-12", + "release_date": "2024-10-03", + "last_updated": "2026-03-12", + "cost": { + "input": 0.15, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "openai-gpt-52", + "name": "GPT-5.2", + "display_name": "GPT-5.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, "output": 65536 }, "temperature": true, @@ -134598,43 +142600,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-08-31", + "release_date": "2025-12-13", + "last_updated": "2026-03-12", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "gemma-4-uncensored", + "name": "Gemma 4 Uncensored", + "display_name": "Gemma 4 Uncensored", "modalities": { "input": [ "text", @@ -134645,63 +142626,105 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 8192 }, - "temperature": false, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-13", + "last_updated": "2026-04-19", + "cost": { + "input": 0.1625, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "minimax-m25", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + 
] + }, + "limit": { + "context": 198000, + "output": 32768 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-02-12", + "last_updated": "2026-04-12", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.34, + "output": 1.19, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "gemma-3n-e2b-it", - "name": "Gemma 3n 2B", - "display_name": "Gemma 3n 2B", + "id": "openai-gpt-55-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2000 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-04-25", "cost": { - "input": 0, - "output": 0 + "input": 37.5, + "output": 225 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", @@ -134712,10 +142735,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -134725,39 
+142748,45 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", "effort_options": [ - "none", "low", "medium", "high" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-16", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 3.6, + "output": 18, + "cache_read": 0.36, + "cache_write": 4.5 }, "type": "chat" }, { - "id": "grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "kimi-k2-6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -134768,8 +142797,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -134777,113 +142806,131 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": true, + "release_date": "2026-04-20", + "last_updated": "2026-04-30", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.85, + "output": 4.655, + "cache_read": 0.22 }, "type": "chat" }, 
{ - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "llama-3.3-70b", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-06", + "last_updated": "2026-03-12", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.7, + "output": 2.8 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3-Next 80B-A3B (Thinking)", - "display_name": "Qwen3-Next 80B-A3B (Thinking)", + "id": "claude-opus-4-6-fast", + "name": "Claude Opus 4.6 Fast", + "display_name": "Claude Opus 4.6 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a 
deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.5, - "output": 6 + "input": 36, + "output": 180, + "cache_read": 3.6, + "cache_write": 45 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "qwen3-5-35b-a3b", + "name": "Qwen 3.5 35B A3B", + "display_name": "Qwen 3.5 35B A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -134891,7 +142938,7 @@ }, "limit": { "context": 256000, - "output": 10000 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -134899,83 +142946,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "attachment": true, + "open_weights": true, + "release_date": "2026-02-25", + "last_updated": "2026-04-16", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.3125, + "output": 1.25, + "cache_read": 0.15625 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "qwen3-5-397b-a17b", + "name": "Qwen 3.5 397B", + "display_name": "Qwen 3.5 397B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", 
- "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2026-02-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "gemma-3-4b-it", - "name": "Gemma 3 4B", - "display_name": "Gemma 3 4B", + "id": "grok-4-20-multi-agent", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ "text", @@ -134986,40 +143005,58 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 2000000, + "output": 128000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "open_weights": false, + "release_date": "2026-03-12", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, + "tiers": [ + { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 + } }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "openai-gpt-54-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": 
true, @@ -135027,38 +143064,24 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-31", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.9375, + "output": 5.625, + "cache_read": 0.09375 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "olafangensan-glm-4.7-flash-heretic", + "name": "GLM 4.7 Flash Heretic", + "display_name": "GLM 4.7 Flash Heretic", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -135066,55 +143089,40 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 24000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-04", + "last_updated": "2026-03-12", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.14, + "output": 0.8 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "grok-4-20", + "name": "Grok 4.20", + "display_name": "Grok 4.20", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 
131072, - "output": 98304 + "context": 2000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -135122,23 +143130,37 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-12", + "last_updated": "2026-05-07", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, + "tiers": [ + { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 + } }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -135149,131 +143171,109 @@ ] }, "limit": { - "context": 1050000, + "context": 1000000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", "effort": "high", "effort_options": [ + "low", "medium", "high", "xhigh" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 30, - "output": 180 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "qwen-3-6-plus", + "name": "Qwen 3.6 Plus Uncensored", + "display_name": "Qwen 3.6 Plus Uncensored", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", - "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 - }, - "type": "chat" - }, - { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 100000 - }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "release_date": "2026-04-06", + "last_updated": "2026-04-12", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.625, + "output": 3.75, + "cache_read": 0.0625, + "cache_write": 0.78, + "tiers": [ + { + "input": 2.5, + "output": 7.5, + 
"cache_read": 0.0625, + "cache_write": 0.78, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 7.5, + "cache_read": 0.0625, + "cache_write": 0.78 + } }, "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "openai-gpt-54-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", @@ -135284,29 +143284,43 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "release_date": "2026-03-05", + "last_updated": "2026-03-09", "cost": { - "input": 0.8, - "output": 3.2 + "input": 37.5, + "output": 225, + "tiers": [ + { + "input": 75, + "output": 337.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 75, + "output": 337.5 + } }, "type": "chat" }, { - "id": "sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -135316,29 +143330,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + 
"release_date": "2026-04-24", + "last_updated": "2026-04-29", "cost": { - "input": 1, - "output": 1 + "input": 0.17, + "output": 0.35, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen 3 235B A22B Instruct 2507", + "display_name": "Qwen 3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -135348,8 +143374,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -135357,32 +143383,35 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-03-12", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.15, + "output": 0.75 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -135390,26 +143419,42 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2025-12-19", + 
"last_updated": "2026-03-12", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 0.7, + "output": 3.75, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "qwen3-6-27b", + "name": "Qwen 3.6 27B", + "display_name": "Qwen 3.6 27B", "modalities": { "input": [ "text", @@ -135421,8 +143466,8 @@ ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -135431,31 +143476,31 @@ "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-04-29", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0.325, + "output": 3.25 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "qwen3-5-9b", + "name": "Qwen 3.5 9B", + "display_name": "Qwen 3.5 9B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -135463,33 +143508,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-03-05", + "last_updated": "2026-04-19", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.1, + "output": 0.15 }, "type": "chat" }, { - "id": "grok-4", - "name": 
"Grok 4", - "display_name": "Grok 4", + "id": "qwen3-coder-480b-a35b-instruct-turbo", + "name": "Qwen 3 Coder 480B Turbo", + "display_name": "Qwen 3 Coder 480B Turbo", "modalities": { "input": [ "text" @@ -135500,100 +143532,122 @@ }, "limit": { "context": 256000, - "output": 64000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-02-26", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 0.35, + "output": 1.5, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3-Next 80B-A3B Instruct", - "display_name": "Qwen3-Next 80B-A3B Instruct", + "id": "claude-opus-4-7-fast", + "name": "Claude Opus 4.7 Fast", + "display_name": "Claude Opus 4.7 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + 
"task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-14", + "last_updated": "2026-05-14", "cost": { - "input": 0.5, - "output": 2 + "input": 36, + "output": 180, + "cache_read": 3.6, + "cache_write": 45 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "openai-gpt-52-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-08", + "release_date": "2025-01-15", + "last_updated": "2026-03-12", "cost": { - "input": 30, - "output": 60 + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen 3 235B A22B Thinking 2507", + "display_name": "Qwen 3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -135603,8 +143657,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -135614,26 +143668,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": 
"2026-03-12", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.45, + "output": 3.5 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "google-gemma-4-26b-a4b-it", + "name": "Google Gemma 4 26B A4B Instruct", + "display_name": "Google Gemma 4 26B A4B Instruct", "modalities": { "input": [ "text", @@ -135645,8 +143703,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -135654,38 +143712,24 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-04-02", + "last_updated": "2026-04-12", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.1625, + "output": 0.5 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "openai-gpt-4o-2024-11-20", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" @@ -135693,42 +143737,39 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "release_date": "2026-02-28", + "last_updated": "2026-03-06", "cost": { - "input": 0.3, - "output": 0.9 + "input": 3.125, + "output": 12.5 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - 
"display_name": "Claude Opus 4.1", + "id": "openai-gpt-54", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -135738,36 +143779,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-03-05", + "last_updated": "2026-03-09", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3.13, + "output": 18.8, + "cache_read": 0.313 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -135777,77 +143815,77 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-16", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "venice-uncensored-role-play", + "name": "Venice Role Play Uncensored", + "display_name": "Venice Role Play Uncensored", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "open_weights": true, + "release_date": "2026-02-20", + "last_updated": "2026-03-16", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "zai-org-glm-5-1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -135857,8 +143895,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 200000, + "output": 24000 }, "temperature": true, "tool_call": true, @@ -135866,35 +143904,43 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": 
"2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-04-07", + "last_updated": "2026-04-08", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.75, + "output": 5.5, + "cache_read": 0.325 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3-VL Plus", - "display_name": "Qwen3-VL Plus", + "id": "zai-org-glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 198000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -135914,33 +143960,35 @@ } }, "attachment": false, - "open_weights": false, + "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-12-24", + "last_updated": "2026-03-12", "cost": { - "input": 0.2, - "output": 1.6, - "reasoning": 4.8 + "input": 0.55, + "output": 2.65, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "grok-4-1-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "gemini-3-1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -135950,33 +143998,48 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "release_date": "2026-02-19", + "last_updated": "2026-03-12", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 2.5, + "output": 15, + "cache_read": 0.5, + "cache_write": 0.5, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + 
"context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "kimi-k2-5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -135984,23 +144047,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-04", + "release_date": "2026-01-27", + "last_updated": "2026-04-30", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.56, + "output": 3.5, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "aion-labs-aion-2-0", + "name": "Aion 2.0", + "display_name": "Aion 2.0", "modalities": { "input": [ "text" @@ -136010,8 +144083,41 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-24", + "last_updated": "2026-04-12", + "cost": { + "input": 1, + "output": 2, + "cache_read": 0.25 + }, + "type": "chat" + }, + { + "id": "qwen3-next-80b", + "name": "Qwen 3 Next 80b", + "display_name": "Qwen 3 Next 80b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + 
}, + "limit": { + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -136020,82 +144126,53 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-03-12", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.35, + "output": 1.9 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "z-ai-glm-5v-turbo", + "name": "GLM 5V Turbo", + "display_name": "GLM 5V Turbo", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2026-04-01", + "last_updated": "2026-04-12", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.5, + "output": 5, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "openai-gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ "text" @@ -136105,8 +144182,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -136114,33 +144191,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-07", + "release_date": "2025-11-06", + "last_updated": "2026-05-06", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.07, + "output": 0.3 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -136151,130 +144216,116 @@ ] }, "limit": { - "context": 1047576, + "context": 198000, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - 
"last_updated": "2025-04-14", + "release_date": "2025-12-06", + "last_updated": "2026-04-12", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 50000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2026-02-20", + "last_updated": "2026-04-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3125, + "output": 0.9375, + "cache_read": 0.03125 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "openai-gpt-53-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - 
"attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-24", + "last_updated": "2026-03-12", "cost": { - "input": 0.45, - "output": 2.25 + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "google-gemma-4-31b-it", + "name": "Google Gemma 4 31B Instruct", + "display_name": "Google Gemma 4 31B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -136282,27 +144333,29 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-04-03", + "last_updated": "2026-04-12", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.175, + "output": 0.5 }, "type": "chat" - }, + } + ] + }, + "fireworks-ai": { + "id": "fireworks-ai", + "name": "Fireworks AI", + "display_name": "Fireworks AI", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://fireworks.ai/docs/", + "models": [ { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "accounts/fireworks/models/minimax-m2p7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -136312,8 +144365,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -136333,41 +144386,33 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - 
"release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "release_date": "2026-04-12", + "last_updated": "2026-04-12", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "accounts/fireworks/models/glm-4p7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 198000, + "output": 198000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -136376,33 +144421,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.6, + "output": 2.2, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "accounts/fireworks/models/qwen3p6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ "text", @@ -136413,50 +144455,33 @@ ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { 
"supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2026-04-04", + "last_updated": "2026-04-04", "cost": { - "input": 15, - "output": 120 + "input": 0.5, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "accounts/fireworks/models/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -136471,33 +144496,33 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "minimax-m2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "accounts/fireworks/models/kimi-k2p6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -136507,25 +144532,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, 
"attachment": false, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "accounts/fireworks/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -136535,8 +144565,8 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -136546,44 +144576,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-04-28", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { "input": 0.05, - "output": 0.2, - "reasoning": 0.5 + "output": 0.2 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "accounts/fireworks/models/deepseek-v3p2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 160000, + "output": 160000 }, "temperature": true, "tool_call": true, @@ -136593,97 +144613,88 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": 
false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.56, + "output": 1.68, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "accounts/fireworks/models/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.6, + "output": 2.5, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "accounts/fireworks/models/glm-4p5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + 
"output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -136692,40 +144703,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "accounts/fireworks/models/minimax-m2p5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -136735,8 +144735,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -136746,37 +144746,43 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": 
"MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "accounts/fireworks/models/kimi-k2p5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -136797,20 +144803,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "accounts/fireworks/models/minimax-m2p1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -136820,8 +144826,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, @@ -136841,69 +144847,64 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.13, - "cache_write": 1.625 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "accounts/fireworks/models/deepseek-v3p1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 163840 
}, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 1.25, - "output": 10 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "accounts/fireworks/models/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -136911,27 +144912,28 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "accounts/fireworks/models/glm-4p5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -136939,134 +144941,163 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, 
"open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 2.8, - "output": 8.4 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "accounts/fireworks/models/glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 202752, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", - "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 1, + "output": 3.2, + "cache_read": 0.5 + }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "accounts/fireworks/models/glm-5p1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 202800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", 
+ "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "devstral-small-2507", - "name": "Devstral Small", - "display_name": "Devstral Small", + "id": "accounts/fireworks/routers/kimi-k2p5-turbo", + "name": "Kimi K2.5 Turbo", + "display_name": "Kimi K2.5 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "accounts/fireworks/models/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -137076,8 +145107,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -137098,34 +145129,39 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - 
"release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.6, - "output": 2.5, + "input": 1.74, + "output": 3.48, "cache_read": 0.15 }, "type": "chat" - }, + } + ] + }, + "alibaba": { + "id": "alibaba", + "name": "alibaba", + "display_name": "alibaba", + "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", + "models": [ { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 8192 }, "temperature": true, @@ -137133,56 +145169,59 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.175, + "output": 0.7 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "qwen3-livetranslate-flash-realtime", + "name": "Qwen3-LiveTranslate Flash Realtime", + "display_name": "Qwen3-LiveTranslate Flash Realtime", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 53248, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, 
"knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 10, + "output": 10, + "input_audio": 10, + "output_audio": 38 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ "text", @@ -137192,61 +145231,6 @@ "text" ] }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, "limit": { "context": 131072, "output": 8192 @@ -137257,55 +145241,67 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 2.8, + "output": 8.4 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - 
"display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.4, + "output": 2.4, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "qwen3-vl-plus", + "name": "Qwen3 VL Plus", + "display_name": "Qwen3 VL Plus", "modalities": { "input": [ "text", @@ -137316,89 +145312,106 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - 
"input": 2, - "output": 8 + "input": 0.2, + "output": 1.6, + "reasoning": 4.8 }, "type": "chat" - } - ] - }, - "google-vertex": { - "id": "google-vertex", - "name": "Vertex", - "display_name": "Vertex", - "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", - "models": [ + }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "display_name": "Qwen3-VL 235B-A22B", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.025 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "qwen3.6-27b", + "name": "Qwen3.6 27B", + "display_name": "Qwen3.6 27B", "modalities": { "input": [ "text", "image", "video", - "audio", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -137410,151 +145423,146 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" 
- ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "id": 
"qwen3-8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.18, + "output": 0.7, + "reasoning": 2.1 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text", "image", - "audio", "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -137566,99 +145574,71 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - 
"open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.4, + "output": 3.2 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09-25", - "display_name": "Gemini 2.5 Flash Preview 09-25", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "zai-org/glm-5-maas", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen3-235b-a22b", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ "text" @@ -137668,14 +145648,19 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": 
true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -137690,31 +145675,34 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.1 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-maas", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", - "pdf" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -137733,88 +145721,112 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-06", - "last_updated": "2026-01-06", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { "input": 0.6, - "output": 2.2 + "output": 3.6 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-maas", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": 
{ + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-17", - "last_updated": "2026-04-04", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.056 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.1-maas", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "display_name": "Qwen-Omni Turbo Realtime", "modalities": { "input": [ "text", - "pdf" + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.6, - "output": 1.7 + "input": 0.27, + "output": 1.07, + "input_audio": 4.44, + "output_audio": 8.89 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b-maas", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen-mt-turbo", + "name": "Qwen Mt Turbo", + "display_name": "Qwen Mt Turbo", "modalities": { "input": [ "text" @@ -137824,29 +145836,29 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": 
"2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.09, - "output": 0.36 + "input": 0.16, + "output": 0.49 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b-maas", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ "text" @@ -137857,28 +145869,52 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-04-28", "cost": { - "input": 0.07, - "output": 0.25 + "input": 0.05, + "output": 0.2, + "reasoning": 0.5 }, "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct-maas", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ "text" @@ -137888,7 +145924,7 @@ ] }, "limit": { - "context": 128000, + "context": 32768, "output": 8192 }, "temperature": true, @@ -137896,21 +145932,27 @@ "reasoning": { "supported": false }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + 
"knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0.72, - "output": 0.72 + "input": 1.6, + "output": 6.4 }, "type": "chat" }, { - "id": "meta/llama-4-maverick-17b-128e-instruct-maas", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "id": "qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "display_name": "Qwen2.5-VL 7B Instruct", "modalities": { "input": [ "text", @@ -137921,7 +145963,7 @@ ] }, "limit": { - "context": 524288, + "context": 131072, "output": 8192 }, "temperature": true, @@ -137929,21 +145971,21 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { "input": 0.35, - "output": 1.15 + "output": 1.05 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507-maas", - "name": "Qwen3 235B A22B Instruct", - "display_name": "Qwen3 235B A22B Instruct", + "id": "qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "display_name": "Qwen2.5 32B Instruct", "modalities": { "input": [ "text" @@ -137953,40 +145995,74 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0.7, + "output": 2.8 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-maas", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + 
"display_name": "Qwen3-ASR Flash", "modalities": { "input": [ + "audio" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 53248, + "output": 4096 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", + "cost": { + "input": 0.035, + "output": 0.035 + }, + "type": "chat" + }, + { + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", + "modalities": { + "input": [ + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -138006,246 +146082,333 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, "type": "chat" }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": 
true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "display_name": "Gemini 2.5 Pro Preview 05-06", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ 
- "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", + "cost": { + "input": 0.5, + "output": 6 + }, + "type": "chat" + }, + { + "id": "qwen-mt-plus", + "name": "Qwen Mt Plus", + "display_name": "Qwen Mt Plus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 2.46, + "output": 7.37 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + 
"output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", + "cost": { + "input": 0.21, + "output": 0.63 + }, + "type": "chat" + }, + { + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", "modalities": { "input": [ "text", "image", "audio", - "video", - "pdf" + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 32768, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", + "cost": { + "input": 0.07, + "output": 0.27, + "input_audio": 4.44, + "output_audio": 8.89 + }, + "type": "chat" + }, + { + "id": "qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "display_name": "Qwen3-VL 30B-A3B", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 
0.025 + "input": 0.2, + "output": 0.8, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "qwen3.5-35b-a3b", + "name": "Qwen3.5 35B-A3B", + "display_name": "Qwen3.5 35B-A3B", "modalities": { "input": [ "text", "image", "video", - "audio", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -138256,40 +146419,75 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "output": 2 + }, + "type": "chat" + }, + { + "id": "qwen-vl-ocr", + "name": "Qwen Vl Ocr", + "display_name": "Qwen Vl Ocr", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 34096, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", + "cost": { + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ "text", "image", "video", - "audio", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 
}, "temperature": true, @@ -138301,56 +146499,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.248, + "output": 1.485 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "display_name": "Qwen3-Omni Flash", "modalities": { "input": [ "text", "image", - "video", "audio", - "pdf" + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -138361,101 +146546,95 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + 
"input": 0.43, + "output": 1.66, + "input_audio": 3.81, + "output_audio": 15.11 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "display_name": "Gemini 2.5 Flash Preview 05-20", + "id": "qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "display_name": "Qwen2.5 14B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", + "cost": { + "input": 0.35, + "output": 1.4 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "type": "chat" + }, + { + "id": "qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 1.4, + "output": 5.6 }, "type": "chat" }, { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": 
"Gemini Embedding 001", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ "text" @@ -138465,44 +146644,41 @@ ] }, "limit": { - "context": 2048, - "output": 3072 + "context": 262144, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.15, - "output": 0 + "input": 1.5, + "output": 7.5 }, - "type": "embedding" + "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "qvq-max", + "name": "QVQ Max", + "display_name": "QVQ Max", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -138510,60 +146686,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 
1.2, + "output": 4.8 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "display_name": "Gemini 2.5 Pro Preview 06-05", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -138575,211 +146722,190 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2025-04", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 1.3, + "output": 7.8, + "cache_read": 0.13, + "cache_write": 1.625 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - 
"last_updated": "2026-05-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.45, + "output": 2.25 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "display_name": "Gemini 2.5 Flash Preview 04-17", + "id": "qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "display_name": "Qwen3-Omni Flash Realtime", "modalities": { "input": [ "text", "image", "audio", - "video", - "pdf" + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.52, + "output": 1.99, + "input_audio": 4.57, + "output_audio": 18.13 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 
131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", + "cost": { + "input": 0.5, + "output": 2 + }, + "type": "chat" + }, + { + "id": "qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ "text", "image", - "audio", "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.3, + "output": 2.4 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 8192 }, "temperature": true, @@ -138787,29 +146913,21 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": 
"2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.8, + "output": 3.2 }, "type": "chat" - } - ] - }, - "groq": { - "id": "groq", - "name": "Groq", - "display_name": "Groq", - "doc": "https://console.groq.com/docs/models", - "models": [ + }, { - "id": "gemma2-9b-it", - "name": "Gemma 2 9B", - "display_name": "Gemma 2 9B", + "id": "qwen-plus-character-ja", + "name": "Qwen Plus Character (Japanese)", + "display_name": "Qwen Plus Character (Japanese)", "modalities": { "input": [ "text" @@ -138820,7 +146938,7 @@ }, "limit": { "context": 8192, - "output": 8192 + "output": 512 }, "temperature": true, "tool_call": true, @@ -138828,31 +146946,35 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-06-27", - "last_updated": "2024-06-27", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.5, + "output": 1.4 }, "type": "chat" }, { - "id": "mistral-saba-24b", - "name": "Mistral Saba 24B", - "display_name": "Mistral Saba 24B", + "id": "qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "display_name": "Qwen2.5-Omni 7B", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { "context": 32768, - "output": 32768 + "output": 2048 }, "temperature": true, "tool_call": true, @@ -138860,20 +146982,21 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-02-06", - "last_updated": "2025-02-06", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.79, - "output": 0.79 + "input": 0.1, + "output": 0.4, + "input_audio": 6.76 }, "type": "chat" }, { - "id": 
"deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ "text" @@ -138883,35 +147006,53 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0.75, - "output": 0.99 + "input": 0.4, + "output": 1.2, + "reasoning": 4 }, "type": "chat" }, { - "id": "llama-guard-3-8b", - "name": "Llama Guard 3 8B", - "display_name": "Llama Guard 3 8B", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -138921,28 +147062,29 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "llama-3.3-70b-versatile", - 
"name": "Llama 3.3 70B Versatile", - "display_name": "Llama 3.3 70B Versatile", + "id": "qwen3-14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ "text" @@ -138953,28 +147095,46 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.59, - "output": 0.79 + "input": 0.35, + "output": 1.4, + "reasoning": 4.2 }, "type": "chat" }, { - "id": "allam-2-7b", - "name": "ALLaM-2-7b", - "display_name": "ALLaM-2-7b", + "id": "qwen3-coder-plus-2025-09-23", + "name": "Qwen3 Coder Plus 2025 09 23", + "display_name": "Qwen3 Coder Plus 2025 09 23", "modalities": { "input": [ "text" @@ -138984,40 +147144,57 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09", - "last_updated": "2024-09", - "cost": { - "input": 0, - "output": 0 + "type": "chat" + }, + { + "id": "qwen3-coder-plus-2025-07-22", + "name": "Qwen3 Coder Plus 2025 07 22", + "display_name": "Qwen3 Coder Plus 2025 07 22", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 65536 }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": 
false + }, + "attachment": false, "type": "chat" }, { - "id": "whisper-large-v3", - "name": "Whisper Large V3", - "display_name": "Whisper Large V3", + "id": "qwen-vl-ocr-latest", + "name": "Qwen Vl Ocr Latest", + "display_name": "Qwen Vl Ocr Latest", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 448, - "output": 448 + "context": 34096, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -139025,23 +147202,16 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "llama-3.1-8b-instant", - "name": "Llama 3.1 8B Instant", - "display_name": "Llama 3.1 8B Instant", + "id": "qvq-max-2025-05-15", + "name": "Qvq Max 2025 05 15", + "display_name": "Qvq Max 2025 05 15", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -139049,28 +147219,26 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 16384, + "min": 0, + "max": 16384 + } }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.05, - "output": 0.08 - }, "type": "chat" }, { - "id": "llama3-70b-8192", - "name": "Llama 3 70B", - "display_name": "Llama 3 70B", + "id": "qwen-long", + "name": "Qwen Long", + "display_name": "Qwen Long", "modalities": { "input": [ "text" @@ -139080,29 +147248,21 @@ ] }, "limit": { - "context": 8192, + "context": 1000000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - 
"release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0.59, - "output": 0.79 - }, "type": "chat" }, { - "id": "qwen-qwq-32b", - "name": "Qwen QwQ 32B", - "display_name": "Qwen QwQ 32B", + "id": "qwen-turbo-latest", + "name": "Qwen Turbo Latest", + "display_name": "Qwen Turbo Latest", "modalities": { "input": [ "text" @@ -139119,55 +147279,61 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-11-27", - "last_updated": "2024-11-27", - "cost": { - "input": 0.29, - "output": 0.39 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "whisper-large-v3-turbo", - "name": "Whisper Large v3 Turbo", - "display_name": "Whisper Large v3 Turbo", + "id": "qwen-turbo-2024-09-19", + "name": "Qwen Turbo 2024 09 19", + "display_name": "Qwen Turbo 2024 09 19", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 448, - "output": 448 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "llama3-8b-8192", - "name": "Llama 3 8B", - "display_name": "Llama 3 8B", + "id": "qwen-flash-2025-07-28", + "name": "Qwen Flash 2025 07 28", + "display_name": "Qwen Flash 2025 07 28", "modalities": { "input": [ "text" @@ -139177,97 
+147343,118 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0.05, - "output": 0.08 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "canopylabs/orpheus-arabic-saudi", - "name": "Orpheus Arabic Saudi", - "display_name": "Orpheus Arabic Saudi", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 4000, - "output": 50000 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-12-16", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "cost": { - "input": 40, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "canopylabs/orpheus-v1-english", - "name": "Orpheus V1 
English", - "display_name": "Orpheus V1 English", + "id": "qwen-plus-2024-09-19", + "name": "Qwen Plus 2024 09 19", + "display_name": "Qwen Plus 2024 09 19", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 4000, - "output": 50000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-12-19", - "release_date": "2025-12-19", - "last_updated": "2025-12-19", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B", - "display_name": "Llama 4 Scout 17B", + "id": "qwen-plus-2025-07-14", + "name": "Qwen Plus 2025 07 14", + "display_name": "Qwen Plus 2025 07 14", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -139275,28 +147462,90 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.11, - "output": 0.34 + "type": "chat" + }, + { + "id": "qwen-plus-2025-09-11", + "name": "Qwen Plus 2025 09 11", + "display_name": "Qwen Plus 2025 09 11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 32768 + }, + "temperature": true, + 
"tool_call": true, + "reasoning": { + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "type": "chat" }, { - "id": "meta-llama/llama-prompt-guard-2-22m", - "name": "Llama Prompt Guard 2 22M", - "display_name": "Llama Prompt Guard 2 22M", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ "text" @@ -139306,73 +147555,68 @@ ] }, "limit": { - "context": 512, - "output": 512 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", - "cost": { - "input": 0.03, - "output": 0.03 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta-llama/llama-guard-4-12b", - "name": "Llama Guard 4 12B", - "display_name": "Llama Guard 4 12B", + "id": "qwen-max-2024-09-19", + "name": "Qwen Max 2024 09 19", + "display_name": "Qwen Max 2024 09 19", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 1024 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.2, - "output": 0.2 + "search": { + "supported": true, + "default": 
false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick-17b-128e-instruct", - "name": "Llama 4 Maverick 17B", - "display_name": "Llama 4 Maverick 17B", + "id": "qwen-max-2024-04-28", + "name": "Qwen Max 2024 04 28", + "display_name": "Qwen Max 2024 04 28", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, @@ -139380,20 +147624,12 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.2, - "output": 0.6 - }, "type": "chat" }, { - "id": "meta-llama/llama-prompt-guard-2-86m", - "name": "Llama Prompt Guard 2 86M", - "display_name": "Llama Prompt Guard 2 86M", + "id": "qwen-max-2024-04-03", + "name": "Qwen Max 2024 04 03", + "display_name": "Qwen Max 2024 04 03", "modalities": { "input": [ "text" @@ -139403,29 +147639,21 @@ ] }, "limit": { - "context": 512, - "output": 512 + "context": 8000, + "output": 2000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", - "cost": { - "input": 0.04, - "output": 0.04 - }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen-max-2025-01-25", + "name": "Qwen Max 2025 01 25", + "display_name": "Qwen Max 2025 01 25", "modalities": { "input": [ "text" @@ -139436,33 +147664,26 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - 
"supported": true - } + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.075, - "output": 0.3 - }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "Safety GPT OSS 20B", - "display_name": "Safety GPT OSS 20B", + "id": "qwen3-max-2025-09-23", + "name": "Qwen3 Max 20250923", + "display_name": "Qwen3 Max 20250923", "modalities": { "input": [ "text" @@ -139472,30 +147693,27 @@ ] }, "limit": { - "context": 131072, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", - "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.037 - }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -139505,34 +147723,38 @@ ] }, "limit": { - "context": 131072, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.15, - "output": 0.6 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + 
"attachment": false, "type": "chat" }, { - "id": "qwen/qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -139543,13 +147765,18 @@ }, "limit": { "context": 131072, - "output": 40960 + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -139563,20 +147790,12 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-11-08", - "release_date": "2024-12-23", - "last_updated": "2024-12-23", - "cost": { - "input": 0.29, - "output": 0.59 - }, "type": "chat" }, { - "id": "groq/compound", - "name": "Compound", - "display_name": "Compound", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -139587,29 +147806,20 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09-04", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "groq/compound-mini", - "name": "Compound Mini", - "display_name": "Compound Mini", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -139620,29 +147830,20 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + 
"supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09-04", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -139653,28 +147854,37 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", - "cost": { - "input": 1, - "output": 3 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct-0905", - "name": "Kimi K2 Instruct 0905", - "display_name": "Kimi K2 Instruct 0905", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -139684,37 +147894,38 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 1, - "output": 3 + "extra_capabilities": { + "reasoning": { + "supported": 
true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" - } - ] - }, - "azure": { - "id": "azure", - "name": "Azure", - "display_name": "Azure", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ + }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "qwen3-4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ "text" @@ -139724,64 +147935,79 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.15, - "output": 0.15 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "qwen3-1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 1.7B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 1.75, - "output": 14, 
- "cache_read": 0.175 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "qwen3-0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", "modalities": { "input": [ "text" @@ -139791,66 +148017,80 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", - "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "qwen3-vl-plus-2025-09-23", + "name": "Qwen3 VL Plus 2025 09 23", + "display_name": "Qwen3 VL Plus 2025 09 23", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "qwq-plus-latest", + "name": "QwQ Plus Latest", + "display_name": "QwQ Plus Latest", "modalities": { "input": [ "text" @@ -139860,29 +148100,85 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { + "supported": true, + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "type": "chat" + } + ] + }, + "302ai": { + "id": "302ai", + "name": "302.AI", + "display_name": "302.AI", + "api": "https://api.302.ai/v1", + "doc": "https://doc.302.ai", + "models": [ + { + "id": "claude-opus-4-1-20250805", + "name": "claude-opus-4-1-20250805", + "display_name": "claude-opus-4-1-20250805", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.13, - "output": 0.52 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E 
Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "mistral-large-2512", + "name": "mistral-large-2512", + "display_name": "mistral-large-2512", "modalities": { "input": [ "text", @@ -139894,7 +148190,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -139902,32 +148198,33 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.2, - "output": 0.78 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "claude-haiku-4-5", + "name": "claude-haiku-4-5", + "display_name": "claude-haiku-4-5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -139942,19 +148239,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "knowledge": "2025-02-28", + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -139964,32 +148261,37 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 1000000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + 
"supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "chatgpt-4o-latest", + "name": "chatgpt-4o-latest", + "display_name": "chatgpt-4o-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -139997,33 +148299,31 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-08-08", + "last_updated": "2024-08-08", "cost": { - "input": 0.04, - "output": 0.04 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "glm-5.1", + "name": "glm-5.1", + "display_name": "glm-5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -140031,7 +148331,7 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -140041,29 +148341,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - 
"last_updated": "2025-11-18", + "release_date": "2026-04-10", + "last_updated": "2026-04-10", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.86, + "output": 3.5 }, "type": "chat" }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "gpt-4o", + "name": "gpt-4o", + "display_name": "gpt-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -140071,40 +148376,43 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.3, - "output": 0.61 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -140123,85 +148431,105 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.6, - "output": 3 + "input": 0.72, + "output": 3.2 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "gemini-3-pro-image-preview", + 
"name": "gemini-3-pro-image-preview", + "display_name": "gemini-3-pro-image-preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 64000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.71, - "output": 0.71 + "input": 2, + "output": 120 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "claude-3-5-haiku-latest", + "name": "claude-3-5-haiku-latest", + "display_name": "claude-3-5-haiku-latest", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1.14, - "output": 4.56 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 
Chat", + "id": "gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", "modalities": { "input": [ "text", @@ -140212,31 +148540,52 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "deepseek-chat", + "name": "Deepseek-Chat", + "display_name": "Deepseek-Chat", "modalities": { "input": [ "text" @@ -140247,28 +148596,28 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0.16, - "output": 0.64 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "gpt-5.3-chat", - "name": "GPT-5.3 Chat", - "display_name": "GPT-5.3 Chat", + "id": "gpt-5-thinking", + "name": "gpt-5-thinking", + "display_name": 
"gpt-5-thinking", "modalities": { "input": [ "text", @@ -140279,10 +148628,10 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -140290,33 +148639,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "gemini-2.5-flash-preview-09-2025", + "display_name": "gemini-2.5-flash-preview-09-2025", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -140326,127 +148675,104 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": 
"text-embedding-3-large", - "display_name": "text-embedding-3-large", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8191, - "output": 3072 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "cost": { - "input": 0.13, - "output": 0 - }, - "type": "embedding" - }, - { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "claude-haiku-4-5-20251001", + "name": "claude-haiku-4-5-20251001", + "display_name": "claude-haiku-4-5-20251001", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 0.13, - "output": 0.52 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "doubao-seed-code-preview-251028", + "name": "doubao-seed-code-preview-251028", + "display_name": "doubao-seed-code-preview-251028", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 256000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - 
"knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-11", + "last_updated": "2025-11-11", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.17, + "output": 1.14 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-5.4-nano", + "name": "gpt-5.4-nano", + "display_name": "gpt-5.4-nano", "modalities": { "input": [ "text", @@ -140457,26 +148783,27 @@ ] }, "limit": { - "context": 272000, + "context": 400000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -140489,20 +148816,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 0.2, + "output": 1.25 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ "text", @@ -140513,10 +148839,10 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -140526,39 +148852,36 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - 
"minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "kimi-k2-0905-preview", + "name": "kimi-k2-0905-preview", + "display_name": "kimi-k2-0905-preview", "modalities": { "input": [ "text" @@ -140568,180 +148891,189 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.632, + "output": 2.53 }, "type": "chat" }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "grok-4-1-fast-reasoning", + "name": "grok-4-1-fast-reasoning", + "display_name": "grok-4-1-fast-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 2000000, + "output": 30000 }, "temperature": true, - 
"tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "grok-4.20-multi-agent-beta-0309", + "name": 
"grok-4.20-multi-agent-beta-0309", + "display_name": "grok-4.20-multi-agent-beta-0309", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 2000000, + "output": 30000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.1, - "output": 0 + "input": 2, + "output": 6 }, - "type": "embedding" + "type": "chat" }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "claude-sonnet-4-5-20250929-thinking", + "name": "claude-sonnet-4-5-20250929-thinking", + "display_name": "claude-sonnet-4-5-20250929-thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 2.04, - "output": 2.04 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", 
"modalities": { "input": [ "text" @@ -140751,41 +149083,34 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "name": "grok-4-1-fast-non-reasoning", + "display_name": "grok-4-1-fast-non-reasoning", "modalities": { "input": [ "text", @@ -140796,8 +149121,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -140806,136 +149131,119 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "output": 0.5 }, "type": "chat" }, { - "id": "deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "display_name": "DeepSeek-V3.2-Speciale", + "id": "doubao-seed-1-6-vision-250815", + "name": "doubao-seed-1-6-vision-250815", + "display_name": "doubao-seed-1-6-vision-250815", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 
256000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0.114, + "output": 1.143 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "claude-sonnet-4-5", + "name": "claude-sonnet-4-5", + "display_name": "claude-sonnet-4-5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-07-31", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.125 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "grok-4.20-beta-0309-reasoning", + "name": "grok-4.20-beta-0309-reasoning", + "display_name": 
"grok-4.20-beta-0309-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { "input": 2, "output": 6 @@ -140943,14 +149251,13 @@ "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "claude-opus-4-1-20250805-thinking", + "name": "claude-opus-4-1-20250805-thinking", + "display_name": "claude-opus-4-1-20250805-thinking", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -140968,26 +149275,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-03", + "release_date": "2025-05-27", + "last_updated": "2025-05-27", "cost": { "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "output": 75 }, "type": "chat" }, { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "qwen-max-latest", + "name": "Qwen-Max-Latest", + "display_name": "Qwen-Max-Latest", "modalities": { "input": [ "text" @@ -140997,8 +149303,40 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + 
"knowledge": "2024-11", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", + "cost": { + "input": 0.343, + "output": 1.372 + }, + "type": "chat" + }, + { + "id": "glm-4.7-flashx", + "name": "glm-4.7-flashx", + "display_name": "glm-4.7-flashx", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -141008,52 +149346,80 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2025-04", + "release_date": "2026-01-20", + "last_updated": "2026-01-20", "cost": { - "input": 2.5, - "output": 10 + "input": 0.0715, + "output": 0.429 }, "type": "chat" }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "claude-opus-4-6-thinking", + "name": "claude-opus-4-6-thinking", + "display_name": "claude-opus-4-6-thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2026-02-06", + "last_updated": "2026-03-13", "cost": { - "input": 0.37, - "output": 0.37 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "glm-4.5-airx", + "name": "glm-4.5-airx", + "display_name": "glm-4.5-airx", "modalities": { "input": [ "text" @@ -141064,7 +149430,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -141072,58 +149438,53 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 5.33, - "output": 16 + "input": 0.572, + "output": 1.714 }, "type": "chat" }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "glm-4.5-air", + "name": "glm-4.5-air", + "display_name": "glm-4.5-air", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + 
"input": 0.1143, + "output": 0.286 }, "type": "chat" }, { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "gpt-5.1-chat-latest", + "name": "gpt-5.1-chat-latest", + "display_name": "gpt-5.1-chat-latest", "modalities": { "input": [ "text", @@ -141135,204 +149496,223 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 10, - "output": 30 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "qwen3-235b-a22b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "knowledge": "2025-04", + "release_date": "2025-04-29", + 
"last_updated": "2025-04-29", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.29, + "output": 2.86 }, "type": "chat" }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 1536 + "context": 64000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2025-04", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.12, - "output": 0 + "input": 0.29, + "output": 0.86 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "qwen-flash", + "name": "Qwen-Flash", + "display_name": "Qwen-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": 
"2025-11-14", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.022, + "output": 0.22 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "gemini-3.1-flash-image-preview", + "name": "gemini-3.1-flash-image-preview", + "display_name": "gemini-3.1-flash-image-preview", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-01", + "release_date": "2026-02-27", + "last_updated": "2026-02-27", "cost": { "input": 0.5, - "output": 1.5 + "output": 60 + }, + "type": "imageGeneration" + }, + { + "id": "gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", "modalities": { "input": [ "text" @@ -141342,10 +149722,10 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 204800, + "output": 131072 }, - "temperature": 
false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -141353,34 +149733,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 16.5, - "output": 66, - "cache_read": 8.25 + "input": 0.286, + "output": 1.142 }, "type": "chat" }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -141390,79 +149760,74 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 131072, + "output": 98304 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.1, - "output": 0 + "input": 0.286, + "output": 1.142 }, "type": "chat" }, { - "id": "grok-4-20-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "ministral-14b-2512", + "name": "ministral-14b-2512", + "display_name": "ministral-14b-2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": 
true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 2, - "output": 6 + "input": 0.33, + "output": 0.33 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gpt-5.4-nano-2026-03-17", + "name": "gpt-5.4-nano-2026-03-17", + "display_name": "gpt-5.4-nano-2026-03-17", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 272000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -141481,7 +149846,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -141489,25 +149855,85 @@ "medium", "high" ], - "visibility": "hidden" + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", + "cost": { + "input": 0.2, + "output": 1.25 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-6", + "name": "claude-sonnet-4-6", + "display_name": "claude-sonnet-4-6", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-08-31", + "release_date": "2026-02-18", + "last_updated": "2026-03-13", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "gpt-5-pro", + "name": "gpt-5-pro", + "display_name": "gpt-5-pro", "modalities": { "input": [ "text", @@ -141518,10 +149944,10 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -141529,39 +149955,47 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2024-09-30", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "deepseek-reasoner", + "name": "Deepseek-Reasoner", + "display_name": "Deepseek-Reasoner", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": 
true, "reasoning": { "supported": true, @@ -141570,44 +150004,41 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, "temperature": true, @@ -141617,23 +150048,22 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "deepseek-v3.2-thinking", + "name": "DeepSeek-V3.2-Thinking", + "display_name": "DeepSeek-V3.2-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -141641,99 +150071,126 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": 
false, "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.14, - "output": 0 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", + "id": "doubao-seed-1-8-251215", + "name": "doubao-seed-1-8-251215", + "display_name": "doubao-seed-1-8-251215", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 224000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 1, - "output": 2 + "input": 0.114, + "output": 0.286 }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "gemini-2.5-flash-lite-preview-09-2025", + "display_name": "gemini-2.5-flash-lite-preview-09-2025", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 1000000, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 0.02, - "output": 0 + "input": 0.1, + "output": 0.4 }, - "type": "embedding" + "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "display_name": "gemini-3-pro-preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -141741,63 +150198,93 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.56, - "output": 1.68 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gpt-5.1", + "name": "gpt-5.1", + "display_name": "gpt-5.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { 
"reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", + "id": "qwen3-max-2025-09-23", + "name": "qwen3-max-2025-09-23", + "display_name": "qwen3-max-2025-09-23", "modalities": { "input": [ "text" @@ -141807,72 +150294,149 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 258048, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.86, + "output": 3.43 }, "type": "chat" }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "gpt-5.4", + "name": "gpt-5.4", + "display_name": "gpt-5.4", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + 
"reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "cache_write": 0, + "tiers": [ + { + "input": 5, + "output": 22.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5 + } + }, + "type": "chat" + }, + { + "id": "claude-3-5-haiku-20241022", + "name": "claude-3-5-haiku-20241022", + "display_name": "claude-3-5-haiku-20241022", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "claude-opus-4-5-20251101", + "name": "claude-opus-4-5-20251101", + "display_name": "claude-opus-4-5-20251101", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -141880,21 +150444,21 @@ "supported": true, "default": true }, 
- "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.075, - "output": 0.3 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ "text" @@ -141904,73 +150468,87 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 60, - "output": 120 + "input": 0.575, + "output": 2.3 }, "type": "chat" }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "gemini-2.0-flash-lite", + "name": "gemini-2.0-flash-lite", + "display_name": "gemini-2.0-flash-lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 2000000, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "attachment": true, + "open_weights": false, + "knowledge": 
"2024-11", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "claude-opus-4-20250514", + "name": "claude-opus-4-20250514", + "display_name": "claude-opus-4-20250514", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -141978,27 +150556,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.95, - "output": 4 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "gpt-5.4-mini", + "name": "gpt-5.4-mini", + "display_name": "gpt-5.4-mini", "modalities": { "input": [ "text", @@ -142016,19 +150588,20 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -142039,22 +150612,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-08-31", + 
"release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "kimi-k2-thinking-turbo", + "name": "kimi-k2-thinking-turbo", + "display_name": "kimi-k2-thinking-turbo", "modalities": { "input": [ "text" @@ -142064,40 +150636,43 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.075, - "output": 0.3 + "input": 1.265, + "output": 9.119 }, "type": "chat" }, { - "id": "grok-4-20-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "claude-sonnet-4-5-20250929", + "name": "claude-sonnet-4-5-20250929", + "display_name": "claude-sonnet-4-5-20250929", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -142105,229 +150680,216 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "knowledge": "2025-07-31", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 2, - "output": 6 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 
0301", - "display_name": "GPT-3.5 Turbo 0301", + "id": "grok-4.1", + "name": "grok-4.1", + "display_name": "grok-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "knowledge": "2025-06", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.5, - "output": 2 + "input": 2, + "output": 10 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "qwen3-30b-a3b", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 0.11, + "output": 1.08 }, "type": "chat" }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", + "id": "claude-opus-4-5-20251101-thinking", + "name": "claude-opus-4-5-20251101-thinking", + "display_name": "claude-opus-4-5-20251101-thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "claude-opus-4-7", + "name": "claude-opus-4-7", + "display_name": "claude-opus-4-7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + 
"default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.58, - "output": 1.68 - }, - "type": "chat" - }, - { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", - "modalities": { - "input": [ - "text" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", - "cost": { - "input": 0.17, - "output": 0.68 + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "glm-5-turbo", + "name": "glm-5-turbo", + 
"display_name": "glm-5-turbo", "modalities": { "input": [ "text" @@ -142337,48 +150899,57 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 3, - "output": 4 + "input": 0.72, + "output": 3.2 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "grok-4.20-beta-0309-non-reasoning", + "name": "grok-4.20-beta-0309-non-reasoning", + "display_name": "grok-4.20-beta-0309-non-reasoning", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -142387,21 +150958,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "qwen3-235b-a22b-instruct-2507", + "display_name": "qwen3-235b-a22b-instruct-2507", "modalities": { "input": [ "text" @@ 
-142412,28 +150980,28 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.29, + "output": 1.143 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "display_name": "gemini-3-flash-preview", "modalities": { "input": [ "text", @@ -142444,10 +151012,10 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -142457,135 +151025,106 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ "minimal", "low", "medium", "high" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" - }, - { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, 
- "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", - "cost": { - "input": 60, - "output": 120 - }, - "type": "chat" - }, - { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 512, - "output": 1024 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "knowledge": "2025-06", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 0.1, - "output": 0 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", + "id": "gpt-5.4-pro", + "name": "gpt-5.4-pro", + "display_name": "gpt-5.4-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.125, - "output": 0.5 + "input": 30, + "output": 180, + "cache_read": 0, + 
"cache_write": 0, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "gpt-5.2-chat-latest", + "name": "gpt-5.2-chat-latest", + "display_name": "gpt-5.2-chat-latest", "modalities": { "input": [ "text", @@ -142597,28 +151136,29 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2025-08-31", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.4, - "output": 2 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -142628,29 +151168,39 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.5, - "output": 2 + "input": 0.6, + "output": 4.8 }, "type": 
"chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "qwen3-coder-480b-a35b-instruct", + "display_name": "qwen3-coder-480b-a35b-instruct", "modalities": { "input": [ "text" @@ -142660,96 +151210,69 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.86, + "output": 3.43 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-4.1-nano", + "name": "gpt-4.1-nano", + "display_name": "gpt-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", 
"cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "gpt-5.4-mini-2026-03-17", + "name": "gpt-5.4-mini-2026-03-17", + "display_name": "gpt-5.4-mini-2026-03-17", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { @@ -142772,7 +151295,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -142783,22 +151307,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "MiniMax-M1", + "name": "MiniMax-M1", + "display_name": "MiniMax-M1", "modalities": { "input": [ "text" @@ -142808,8 +151331,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -142818,19 +151341,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.132, + "output": 1.254 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { 
"input": [ "text", @@ -142841,62 +151363,83 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.25, - "output": 1 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "gemini-2.5-flash-image", + "name": "gemini-2.5-flash-image", + "display_name": "gemini-2.5-flash-image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-01", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.3, + "output": 30 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ "text", 
@@ -142914,16 +151457,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -142939,20 +151482,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-05-30", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "claude-opus-4-6", + "name": "claude-opus-4-6", + "display_name": "claude-opus-4-6", "modalities": { "input": [ "text", @@ -142965,7 +151507,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -143001,240 +151543,199 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", + "knowledge": "2025-05-31", + "release_date": "2026-02-06", "last_updated": "2026-03-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "doubao-seed-1-6-thinking-250715", + "name": "doubao-seed-1-6-thinking-250715", + "display_name": "doubao-seed-1-6-thinking-250715", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 256000, + "output": 16000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.121, + "output": 1.21 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 10, - "output": 30 + "input": 0.286, + "output": 1.142 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "glm-for-coding", + "name": "glm-for-coding", + "display_name": "glm-for-coding", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
128000, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.086, + "output": 0.343 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2025-10-26", + "last_updated": "2025-10-26", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "claude-sonnet-4-20250514", + "name": "claude-sonnet-4-20250514", + "display_name": "claude-sonnet-4-20250514", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, 
"limit": { - "context": 128000, - "output": 4000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.15, - "output": 0.6 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "gemini-2.5-flash-nothink", + "name": "gemini-2.5-flash-nothink", + "display_name": "gemini-2.5-flash-nothink", "modalities": { "input": [ "text", @@ -143245,10 +151746,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -143258,187 +151759,145 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-01", + "release_date": "2025-06-24", + "last_updated": "2025-06-24", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "glm-4.5-x", + "name": "glm-4.5-x", + "display_name": "glm-4.5-x", "modalities": { 
"input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 1.143, + "output": 2.29 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "grok-4-fast-non-reasoning", + "name": "grok-4-fast-non-reasoning", + "display_name": "grok-4-fast-non-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", 
- "display_name": "GPT-5.4 Pro", + "id": "qwen-plus", + "name": "Qwen-Plus", + "display_name": "Qwen-Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1000000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-10", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0.12, + "output": 1.2 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "glm-5", + "name": "glm-5", + "display_name": "glm-5", "modalities": { "input": [ "text" @@ -143448,10 +151907,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -143460,44 +151919,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } 
}, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.6, + "output": 2.6 }, "type": "chat" }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "grok-4-fast-reasoning", + "name": "grok-4-fast-reasoning", + "display_name": "grok-4-fast-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -143510,23 +151965,21 @@ "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "claude-opus-4-5", + "name": "claude-opus-4-5", + "display_name": "claude-opus-4-5", "modalities": { "input": [ "text", @@ -143538,141 +151991,85 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, 
"open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-03-31", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, + "context": 128000, "output": 32768 }, "temperature": true, "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 - }, - "type": "chat" - }, - { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0.145, + "output": 0.43 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "claude-sonnet-4-6-thinking", + "name": "claude-sonnet-4-6-thinking", + "display_name": "claude-sonnet-4-6-thinking", "modalities": { "input": [ "text", - "image" + 
"image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -143682,32 +152079,43 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, "effort": "medium", "effort_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-08", + "release_date": "2026-02-18", + "last_updated": "2026-03-13", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", @@ -143719,7 +152127,7 @@ }, "limit": { "context": 400000, - "output": 272000 + "output": 128000 }, "temperature": false, "tool_call": true, @@ -143731,8 +152139,14 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "fixed", - "effort": "high", + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -143745,52 +152159,71 @@ "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 15, - "output": 120 + "input": 1.25, + 
"output": 10 }, "type": "chat" - }, + } + ] + }, + "xpersona": { + "id": "xpersona", + "name": "Xpersona", + "display_name": "Xpersona", + "api": "https://www.xpersona.co/v1", + "doc": "https://www.xpersona.co/docs", + "models": [ { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "xpersona-frieren-coder", + "name": "Xpersona Frieren Coder", + "display_name": "Xpersona Frieren Coder", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2025-12-30", + "release_date": "2026-05-01", + "last_updated": "2026-05-15", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 1.5, + "output": 6, + "reasoning": 6, + "cache_read": 0.15 }, "type": "chat" - }, + } + ] + }, + "stepfun": { + "id": "stepfun", + "name": "StepFun", + "display_name": "StepFun", + "api": "https://api.stepfun.com/v1", + "doc": "https://platform.stepfun.com/docs/zh/overview/concept", + "models": [ { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "step-1-32k", + "name": "Step 1 (32K)", + "display_name": "Step 1 (32K)", "modalities": { "input": [ "text" @@ -143800,97 +152233,99 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "knowledge": 
"2024-06", + "release_date": "2025-01-01", + "last_updated": "2026-02-13", "cost": { - "input": 2.5, - "output": 10 + "input": 2.05, + "output": 9.59, + "cache_read": 0.41 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "step-2-16k", + "name": "Step 2 (16K)", + "display_name": "Step 2 (16K)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 16384, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-06", + "release_date": "2025-01-01", + "last_updated": "2026-02-13", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 5.21, + "output": 16.44, + "cache_read": 1.04 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "step-3.5-flash-2603", + "name": "Step 3.5 Flash 2603", + "display_name": "Step 3.5 Flash 2603", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": 
"step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -143900,30 +152335,39 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" - }, + } + ] + }, + "xai": { + "id": "xai", + "name": "xai", + "display_name": "xai", + "doc": "https://docs.x.ai/docs/models", + "models": [ { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "grok-4.20-0309-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ "text", @@ -143944,40 +152388,47 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 2, + "output": 6, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + } }, "type": "chat" - } - ] - }, - "fastrouter": { - "id": "fastrouter", - "name": "FastRouter", - "display_name": "FastRouter", - "api": "https://go.fastrouter.ai/api/v1", - "doc": "https://fastrouter.ai/models", - "models": [ + }, { - "id": "x-ai/grok-4", - "name": 
"Grok 4", - "display_name": "Grok 4", + "id": "grok-4.20-0309-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -143985,66 +152436,71 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 15 + "input": 2, + "output": 6, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "grok-vision-beta", + "name": "Grok Vision Beta", + "display_name": "Grok Vision Beta", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-23", - "last_updated": "2025-01-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", 
"cost": { - "input": 0.03, - "output": 0.14 + "input": 5, + "output": 15, + "cache_read": 5 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "grok-2-vision-1212", + "name": "Grok 2 Vision 1212", + "display_name": "Grok 2 Vision 1212", "modalities": { "input": [ "text", @@ -144055,108 +152511,61 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "search": { + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "grok-imagine-image-quality", + "name": "Grok Imagine Image Quality", + "display_name": "Grok Imagine Image Quality", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1024, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - 
"effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 - }, + "release_date": "2026-04", + "last_updated": "2026-05-16", "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "grok-2-1212", + "name": "Grok 2 1212", + "display_name": "Grok 2 1212", "modalities": { "input": [ "text" @@ -144166,127 +152575,95 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "search": { + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-12-12", + "last_updated": "2024-12-12", "cost": { - "input": 0.05, - "output": 0.2 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "grok-beta", + "name": "Grok Beta", + "display_name": "Grok Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - 
"low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 5, + "output": 15, + "cache_read": 5 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "grok-imagine-video", + "name": "Grok Imagine Video", + "display_name": "Grok Imagine Video", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1024, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.15, - "output": 0.6 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03", + "last_updated": "2026-05-16", "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "grok-2", + "name": "Grok 2", + "display_name": "Grok 2", "modalities": { "input": [ "text" @@ -144296,140 +152673,104 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": 
"summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.95, - "output": 3.15 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "qwen/qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "grok-2-vision-latest", + "name": "Grok 2 Vision Latest", + "display_name": "Grok 2 Vision Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "grok-imagine-image", + "name": "Grok Imagine Image", + "display_name": "Grok Imagine Image", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1024, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - 
}, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, + "release_date": "2026-03", + "last_updated": "2026-05-16", "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -144439,284 +152780,275 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.3, + "input": 1.25, "output": 2.5, - "cache_read": 0.0375 + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "moonshotai/kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "grok-2-vision", + "name": "Grok 2 Vision", + "display_name": "Grok 2 Vision", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - 
"output": 32768 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.55, - "output": 2.2 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "grok-2-latest", + "name": "Grok 2 Latest", + "display_name": "Grok 2 Latest", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { "input": 2, - "output": 8, - "cache_read": 0.5 + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "grok-4.20-multi-agent-0309", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 2000000, + "output": 30000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - 
"last_updated": "2025-08-05", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 2, + "output": 6, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "grok-3-mini-fast-beta", + "name": "Grok 3 Mini Fast Beta", + "display_name": "Grok 3 Mini Fast Beta", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "effort": "low" }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "search": { + "supported": false }, + "attachment": false, "type": "chat" - } - ] - }, - "stackit": { - "id": "stackit", - "name": "STACKIT", - "display_name": "STACKIT", - "api": "https://api.openai-compat.model-serving.eu01.onstackit.cloud/v1", - "doc": "https://docs.stackit.cloud/products/data-and-ai/ai-model-serving/basics/available-shared-models", - "models": [ + }, { - "id": "Qwen/Qwen3-VL-Embedding-8B", - "name": "Qwen3-VL Embedding 8B", - "display_name": "Qwen3-VL Embedding 8B", + "id": "grok-3-mini-beta", + "name": "Grok 3 Mini Beta", + "display_name": "Grok 3 Mini Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 120000, + "output": 100000 }, - "temperature": 
false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "effort": "low" }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", - "cost": { - "input": 0.09, - "output": 0.09 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", - "name": "Qwen3-VL 235B", - "display_name": "Qwen3-VL 235B", + "id": "grok-3-fast-beta", + "name": "Grok 3 Fast Beta", + "display_name": "Grok 3 Fast Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 218000, - "output": 8192 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 1.64, - "output": 1.91 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "grok-2-image-1212", + "name": "Grok 2 Image 1212", + "display_name": "Grok 2 Image 1212", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 130000, + "output": 100000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.16, - "output": 0.27 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "neuralmagic/Mistral-Nemo-Instruct-2407-FP8", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "grok-3-beta", + "name": "Grok 3 Beta", + 
"display_name": "Grok 3 Beta", "modalities": { "input": [ "text" @@ -144726,28 +153058,33 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", - "cost": { - "input": 0.49, - "output": 0.71 + "search": { + "supported": false }, + "attachment": false, "type": "chat" - }, + } + ] + }, + "sarvam": { + "id": "sarvam", + "name": "Sarvam AI", + "display_name": "Sarvam AI", + "api": "https://api.sarvam.ai/v1", + "doc": "https://docs.sarvam.ai/api-reference-docs/getting-started/models", + "models": [ { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "sarvam-30b", + "name": "Sarvam-30B", + "display_name": "Sarvam-30B", "modalities": { "input": [ "text" @@ -144757,8 +153094,8 @@ ] }, "limit": { - "context": 131000, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -144768,23 +153105,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.49, - "output": 0.71 - }, + "release_date": "2026-02-18", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "cortecs/Llama-3.3-70B-Instruct-FP8-Dynamic", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "sarvam-105b", + "name": "Sarvam-105B", + "display_name": "Sarvam-105B", "modalities": { "input": [ "text" @@ -144794,113 +153133,104 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": 
false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-12-05", - "last_updated": "2024-12-05", - "cost": { - "input": 0.49, - "output": 0.71 - }, + "release_date": "2026-02-18", + "last_updated": "2026-03-06", "type": "chat" - }, + } + ] + }, + "zhipuai": { + "id": "zhipuai", + "name": "Zhipu AI", + "display_name": "Zhipu AI", + "api": "https://open.bigmodel.cn/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "models": [ { - "id": "google/gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 37000, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-05-17", - "last_updated": "2025-05-17", - "cost": { - "input": 0.49, - "output": 0.71 - }, - "type": "chat" - }, - { - "id": "intfloat/e5-mistral-7b-instruct", - "name": "E5 Mistral 7B", - "display_name": "E5 Mistral 7B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 4096, - "output": 4096 + "supported": true, + "default": true }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "open_weights": false, 
+ "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.02, - "output": 0.02 + "input": 6, + "output": 24, + "cache_read": 1.3, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "tencent-coding-plan": { - "id": "tencent-coding-plan", - "name": "Tencent Coding Plan (China)", - "display_name": "Tencent Coding Plan (China)", - "api": "https://api.lkeap.cloud.tencent.com/coding/v3", - "doc": "https://cloud.tencent.com/document/product/1772/128947", - "models": [ + }, { - "id": "kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", "image", - "video" + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -144920,14 +153250,13 @@ } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 5, + "output": 22, + "cache_read": 1.2, "cache_write": 0 }, "type": "chat" @@ -144945,8 +153274,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -144966,54 +153295,56 @@ } }, "attachment": false, - "open_weights": false, + "open_weights": true, "release_date": "2026-02-11", - "last_updated": "2026-02-11", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "last_updated": "2026-02-11", + "cost": { + "input": 1, + "output": 3.2, + "cache_read": 0.2, "cache_write": 0 }, "type": "chat" }, { - "id": "hunyuan-turbos", - "name": "Hunyuan-TurboS", - "display_name": "Hunyuan-TurboS", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { 
"input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "hunyuan-t1", - "name": "Hunyuan-T1", - "display_name": "Hunyuan-T1", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -145023,8 +153354,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -145044,21 +153375,22 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, "cache_write": 0 }, "type": "chat" }, { - "id": "hunyuan-2.0-instruct", - "name": "Tencent HY 2.0 Instruct", - "display_name": "Tencent HY 2.0 Instruct", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -145069,17 +153401,19 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + 
"open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0, "output": 0, @@ -145089,9 +153423,9 @@ "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -145101,8 +153435,8 @@ ] }, "limit": { - "context": 204800, - "output": 32768 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -145110,33 +153444,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, "cache_write": 0 }, "type": "chat" }, { - "id": "tc-code-latest", - "name": "Auto", - "display_name": "Auto", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -145146,30 +153470,37 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, "cache_write": 0 }, 
"type": "chat" }, { - "id": "hunyuan-2.0-thinking", - "name": "Tencent HY 2.0 Think", - "display_name": "Tencent HY 2.0 Think", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -145179,8 +153510,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -145190,19 +153521,14 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { "input": 0, "output": 0, @@ -145210,85 +153536,81 @@ "cache_write": 0 }, "type": "chat" - } - ] - }, - "privatemode-ai": { - "id": "privatemode-ai", - "name": "Privatemode AI", - "display_name": "Privatemode AI", - "api": "http://localhost:8080/v1", - "doc": "https://docs.privatemode.ai/api/overview", - "models": [ + }, { - "id": "gemma-3-27b", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "whisper-large-v3", 
- "name": "Whisper large-v3", - "display_name": "Whisper large-v3", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 131072, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2023-09-01", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3-embedding-4b", - "name": "Qwen3-Embedding 4B", - "display_name": "Qwen3-Embedding 4B", + "id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ "text" @@ -145298,29 +153620,41 @@ ] }, "limit": { - "context": 32000, - "output": 2560 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-06-06", - "last_updated": "2025-06-06", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0, - "output": 0 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 }, - "type": "embedding" - }, + "type": "chat" + } + ] + }, + "bailing": { + "id": "bailing", + "name": "Bailing", + "display_name": "Bailing", + "api": "https://api.tbox.cn/api/llm/v1/chat/completions", + "doc": "https://alipaytbox.yuque.com/sxs0ba/ling/intro", + "models": [ { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - 
"display_name": "gpt-oss-120b", + "id": "Ring-1T", + "name": "Ring-1T", + "display_name": "Ring-1T", "modalities": { "input": [ "text" @@ -145331,10 +153665,10 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -145346,19 +153680,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-04", - "last_updated": "2025-08-14", + "knowledge": "2024-06", + "release_date": "2025-10", + "last_updated": "2025-10", "cost": { - "input": 0, - "output": 0 + "input": 0.57, + "output": 2.29 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b", - "name": "Qwen3-Coder 30B-A3B", - "display_name": "Qwen3-Coder 30B-A3B", + "id": "Ling-1T", + "name": "Ling-1T", + "display_name": "Ling-1T", "modalities": { "input": [ "text" @@ -145369,7 +153703,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -145378,33 +153712,88 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-06", + "release_date": "2025-10", + "last_updated": "2025-10", "cost": { - "input": 0, - "output": 0 + "input": 0.57, + "output": 2.29 }, "type": "chat" } ] }, - "google": { - "id": "google", - "name": "google", - "display_name": "google", - "doc": "https://ai.google.dev/gemini-api/docs/models", + "qihang-ai": { + "id": "qihang-ai", + "name": "QiHang", + "display_name": "QiHang", + "api": "https://api.qhaigc.net/v1", + "doc": "https://www.qhaigc.net/docs", "models": [ { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 
400000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 0.25, + "output": 2 + }, + "type": "chat" + }, + { + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -145412,8 +153801,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -145423,35 +153812,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-07-31", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.14, + "output": 0.71 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "display_name": "Gemini 2.5 Pro Preview 05-06", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", "image", "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 65000 }, "temperature": true, "tool_call": true, @@ -145463,14 +153850,12 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": 
"budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ @@ -145480,58 +153865,88 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "knowledge": "2025-11", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.57, + "output": 3.43 }, "type": "chat" }, { - "id": "gemini-live-2.5-flash-preview-native-audio", - "name": "Gemini Live 2.5 Flash Preview Native Audio", - "display_name": "Gemini Live 2.5 Flash Preview Native Audio", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "audio", - "video" + "image" ], "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", + "cost": { + "input": 0.71, + "output": 3.57 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", + "modalities": { + "input": [ "text", - "audio" + "image", + "pdf" + ], + "output": [ + "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-09-18", + "knowledge": "2025-07-31", + 
"release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.5, - "output": 2, - "input_audio": 3, - "output_audio": 12 + "input": 0.43, + "output": 2.14 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", @@ -145561,7 +153976,9 @@ "mode": "level", "level": "high", "level_options": [ + "minimal", "low", + "medium", "high" ], "summaries": true, @@ -145574,24 +153991,32 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, + "input": 0.07, + "output": 0.43, + "tiers": [ + { + "input": 0.07, + "output": 0.43, + "tier": { + "type": "context", + "size": 200000 + } + } + ], "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 + "input": 0.07, + "output": 0.43 } }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09 2025", - "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", @@ -145601,6 +154026,64 @@ "text" ] }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": 
"hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 0.14, + "output": 1.14 + }, + "type": "chat" + }, + { + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, "limit": { "context": 1048576, "output": 65536 @@ -145609,23 +154092,19 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": -1, - "min": 512, - "max": 24576 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { "default": -1, - "min": 512, + "min": 0, "max": 24576, "auto": -1, + "off": 0, "unit": "tokens" }, "summaries": true, @@ -145635,98 +154114,145 @@ ] } }, - "search": { - "supported": true, - "default": false - }, "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.09, + "output": 0.71, + "tiers": [ + { + "input": 0.09, + "output": 0.71, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 0.09, + "output": 0.71 + } }, "type": "chat" }, { - "id": "gemini-1.5-flash", - "name": "Gemini 1.5 Flash", - "display_name": "Gemini 1.5 Flash", + "id": "gpt-5-mini", + "name": "GPT-5-Mini", + "display_name": "GPT-5-Mini", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": 
true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.01875 + "input": 0.04, + "output": 0.29 }, "type": "chat" - }, + } + ] + }, + "lilac": { + "id": "lilac", + "name": "Lilac", + "display_name": "Lilac", + "api": "https://api.getlilac.com/v1", + "doc": "https://docs.getlilac.com/inference/models", + "models": [ { - "id": "gemini-1.5-pro", - "name": "Gemini 1.5 Pro", - "display_name": "Gemini 1.5 Pro", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-02-15", - "last_updated": "2024-02-15", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1.25, - "output": 5, - "cache_read": 0.3125 + "input": 0.7, + "output": 3.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "gemma-3n-e4b-it", - 
"name": "Gemma 3n 4B", - "display_name": "Gemma 3n 4B", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -145736,44 +154262,55 @@ ] }, "limit": { - "context": 8192, - "output": 2000 + "context": 202800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-04", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0, - "output": 0 + "input": 0.9, + "output": 3, + "cache_read": 0.27 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262100, + "output": 262100 }, "temperature": true, "tool_call": true, @@ -145783,41 +154320,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + 
"input": 0.11, + "output": 0.35 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "minimaxai/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 204800 }, "temperature": true, "tool_call": true, @@ -145828,189 +154365,149 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.3, + "output": 1.2, + "cache_read": 0.055 }, "type": "chat" - }, + } + ] + }, + "alibaba-cn": { + "id": "alibaba-cn", + "name": "alibaba-cn", + "display_name": "alibaba-cn", + "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", + "models": [ { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "qwen2-5-math-7b-instruct", + "name": "Qwen2.5-Math 7B Instruct", + "display_name": "Qwen2.5-Math 7B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": true, - "default": false - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.144, + "output": 0.287 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "input": 0.072, + "output": 0.144 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-tts", - "name": "Gemini 2.5 Flash Preview TTS", - "display_name": "Gemini 2.5 Flash Preview TTS", + "id": 
"qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8000, - "output": 16000 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.5, - "output": 10 + "input": 2.294, + "output": 6.881 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "kimi-k2.5", + "name": "Moonshot Kimi K2.5", + "display_name": "Moonshot Kimi K2.5", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -146021,55 +154518,41 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.574, + "output": 2.411 }, "type": "chat" }, { - "id": 
"gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "display_name": "Gemini 2.5 Flash Preview 05-20", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 65536 }, "temperature": true, @@ -146081,39 +154564,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.573, + "output": 3.44, + "reasoning": 3.44 }, "type": "chat" }, { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "qwen-math-turbo", + "name": "Qwen Math Turbo", + "display_name": "Qwen Math Turbo", "modalities": { "input": [ "text" @@ -146123,180 +154597,168 @@ ] }, "limit": { - "context": 2048, + "context": 4096, "output": 3072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2024-04", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.15, - "output": 0 + "input": 0.287, + "output": 0.861 }, - "type": "embedding" + "type": "chat" 
}, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 202752, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 128, - "max": 32768 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "search": { - "supported": true, - "default": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-14", + "last_updated": "2026-04-14", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.87, + "output": 3.48, + "cache_read": 0.17 }, "type": "chat" }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "qwen3-vl-plus", + "name": "Qwen3 VL Plus", + "display_name": "Qwen3 VL Plus", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - 
"attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "input": 0.143353, + "output": 1.433525, + "reasoning": 4.300576 }, "type": "chat" }, { - "id": "gemma-4-31b-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "qwen2-5-math-72b-instruct", + "name": "Qwen2.5-Math 72B Instruct", + "display_name": "Qwen2.5-Math 72B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", + "cost": { + "input": 0.574, + "output": 1.721 + }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "display_name": "Gemini 2.5 Pro Preview 06-05", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "display_name": "Qwen3-VL 235B-A22B", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -146307,229 +154769,204 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - 
"default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.286705, + "output": 1.14682, + "reasoning": 2.867051 }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "display_name": "Gemini 2.5 Flash Image", + "id": "deepseek-r1-distill-llama-8b", + "name": "DeepSeek R1 Distill Llama 8B", + "display_name": "DeepSeek R1 Distill Llama 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { "context": 32768, - "output": 32768 + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 + "input": 0, + "output": 0 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "id": "deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": 
true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025, - "input_audio": 0.3 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "gemma-3-12b-it", - "name": "Gemma 3 12B", - "display_name": "Gemma 3 12B", + "id": "qwq-32b", + "name": "QwQ 32B", + "display_name": "QwQ 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0, - "output": 0 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ - "text", - "image" + 
"text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true, "budget": { - "default": -1, + "default": 32768, "min": 0, - "max": 24576 + "max": 32768 } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "search": { "supported": true, - "default": false + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.23, + "output": 0.574 }, "type": "chat" }, { - "id": "gemma-3n-e2b-it", - "name": "Gemma 3n 2B", - "display_name": "Gemma 3n 2B", + "id": "qwen3-8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ "text" @@ -146539,85 +154976,101 @@ ] }, "limit": { - "context": 8192, - "output": 2000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": 
"2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.072, + "output": 0.287, + "reasoning": 0.717 }, "type": "chat" }, { - "id": "gemini-3.1-flash-image-preview", - "name": "Gemini 3.1 Flash Image (Preview)", - "display_name": "Gemini 3.1 Flash Image (Preview)", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { "context": 131072, - "output": 32768 + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.25, - "output": 60 + "input": 0.574, + "output": 2.294 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "deepseek-r1-distill-qwen-1-5b", + "name": "DeepSeek R1 Distill Qwen 1.5B", + "display_name": "DeepSeek R1 Distill Qwen 1.5B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -146625,310 +155078,298 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - 
}, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemma-3-4b-it", - "name": "Gemma 3 4B", - "display_name": "Gemma 3 4B", + "id": "qwen2-5-coder-32b-instruct", + "name": "Qwen2.5-Coder 32B Instruct", + "display_name": "Qwen2.5-Coder 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "cost": { - "input": 0, - "output": 0 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "display_name": "Gemini 2.5 Flash Preview 04-17", + "id": "tongyi-intent-detect-v3", + "name": "Tongyi Intent Detect V3", + "display_name": "Tongyi Intent Detect V3", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": 
true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", + "cost": { + "input": 0.058, + "output": 0.144 }, - "attachment": true, + "type": "chat" + }, + { + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 65536, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.287, + "output": 1.147 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-tts", - "name": "Gemini 2.5 Pro Preview TTS", - "display_name": "Gemini 2.5 Pro Preview TTS", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8000, - "output": 16000 + "context": 262144, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "knowledge": "2025-04", + "release_date": 
"2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 1, - "output": 20 + "input": 0.861, + "output": 3.441 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09 2025", - "display_name": "Gemini 2.5 Flash Preview 09 2025", + "id": "qwen3-235b-a22b", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, + "default": false, "budget": { - "default": -1, + "default": 81920, "min": 0, - "max": 24576 + "max": 81920 } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "search": { - "supported": true, - "default": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "input": 0.287, + "output": 1.147, + "reasoning": 2.868 }, "type": "chat" }, { - "id": "gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0, - "output": 0 + "input": 0.43, + "output": 2.58, + "reasoning": 2.58 }, "type": "chat" }, { - "id": "gemma-4-26b-a4b-it", - "name": "Gemma 4 26B", - "display_name": "Gemma 4 26B", + "id": "qwen-doc-turbo", + "name": "Qwen Doc Turbo", + "display_name": "Qwen Doc Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", + "cost": { + "input": 0.087, + "output": 0.144 + }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -146936,234 +155377,168 @@ "supported": true, "default": false, "budget": { - "default": -1, - "min": 512, - "max": 24576 + "default": 81920, + "min": 0, + "max": 81920 } }, "extra_capabilities": { 
"reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "search": { "supported": true, - "default": false + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.022, + "output": 0.216 }, "type": "chat" }, { - "id": "gemini-2.5-flash-image-preview", - "name": "Gemini 2.5 Flash Image Preview", - "display_name": "Gemini 2.5 Flash Image Preview", + "id": "qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "display_name": "Qwen-Omni Turbo Realtime", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text", - "image" + "audio" ] }, "limit": { "context": 32768, - "output": 32768 + "output": 2048 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 + "input": 0.23, + "output": 0.918, + "input_audio": 3.584, + "output_audio": 7.168 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-1.5-flash-8b", - "name": "Gemini 1.5 Flash-8B", - "display_name": "Gemini 1.5 Flash-8B", + "id": "qwen-mt-turbo", + "name": "Qwen Mt Turbo", + "display_name": "Qwen Mt Turbo", "modalities": { "input": [ 
- "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 16384, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-10-03", - "last_updated": "2024-10-03", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.0375, - "output": 0.15, - "cache_read": 0.01 + "input": 0.101, + "output": 0.28 }, "type": "chat" }, { - "id": "gemini-live-2.5-flash", - "name": "Gemini Live 2.5 Flash", - "display_name": "Gemini Live 2.5 Flash", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", - "cost": { - "input": 0.5, - "output": 2, - "input_audio": 3, - "output_audio": 12 - }, - "type": "chat" - }, - { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1048576, - "output": 8192 + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "search": { - "supported": false + 
"supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-07-15", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.044, + "output": 0.087, + "reasoning": 0.431 }, "type": "chat" }, { - "id": "gemini-2.0-flash-preview-image-generation", - "name": "Gemini 2.0 Flash Preview Image Generation", - "display_name": "Gemini 2.0 Flash Preview Image Generation", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text", - "image" - ] - }, - "limit": { - "context": 32000, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "search": { - "supported": false - }, - "attachment": true, - "type": "chat" - } - ] - }, - "drun": { - "id": "drun", - "name": "D.Run (China)", - "display_name": "D.Run (China)", - "api": "https://chat.d.run/v1", - "doc": "https://www.d.run", - "models": [ - { - "id": "public/deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "moonshot-kimi-k2-instruct", + "name": "Moonshot Kimi K2 Instruct", + "display_name": "Moonshot Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -147174,40 +155549,27 @@ }, "limit": { "context": 131072, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": 
"2025-01-20", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.55, - "output": 2.2 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "public/minimax-m25", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ "text" @@ -147217,43 +155579,39 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, "open_weights": false, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0.29, - "output": 1.16 + "input": 0.345, + "output": 1.377 }, "type": "chat" }, { - "id": "public/deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "display_name": "Qwen2.5-VL 7B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -147270,28 +155628,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.287, + "output": 0.717 }, "type": "chat" - } - ] - }, - "moonshot-ai": { - "id": "moonshot-ai", - "name": "Moonshot AI", - "display_name": "Moonshot AI", - "api": "https://api.moonshot.ai/v1", - 
"doc": "https://platform.moonshot.ai/docs/api/chat", - "models": [ + }, { - "id": "kimi-k2-0905-preview", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "display_name": "Qwen2.5 32B Instruct", "modalities": { "input": [ "text" @@ -147301,8 +155650,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -147311,67 +155660,51 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "display_name": "Qwen3-ASR Flash", "modalities": { "input": [ - "text", - "image", - "video" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 53248, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.032, + "output": 0.032 }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking 
Turbo", + "id": "qwen-math-plus", + "name": "Qwen Math Plus", + "display_name": "Qwen Math Plus", "modalities": { "input": [ "text" @@ -147381,42 +155714,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-08-16", + "last_updated": "2024-09-19", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", @@ -147428,8 +155748,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -147448,22 +155768,41 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, 
"type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -147473,8 +155812,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -147482,21 +155821,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2.4, - "output": 10, - "cache_read": 0.6 + "input": 0.144, + "output": 0.574 }, "type": "chat" }, { - "id": "kimi-k2-0711-preview", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "qwen-plus-character", + "name": "Qwen Plus Character", + "display_name": "Qwen Plus Character", "modalities": { "input": [ "text" @@ -147506,8 +155844,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -147515,21 +155853,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.115, + "output": 0.287 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -147539,14 +155876,19 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 16384 }, "temperature": true, 
"tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { @@ -147561,29 +155903,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.287, + "output": 1.147, + "reasoning": 2.868 }, "type": "chat" - } - ] - }, - "berget": { - "id": "berget", - "name": "Berget.AI", - "display_name": "Berget.AI", - "api": "https://api.berget.ai/v1", - "doc": "https://api.berget.ai", - "models": [ + }, { - "id": "zai-org/GLM-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -147593,14 +155926,19 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -147615,19 +155953,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.77, - "output": 2.75 + "input": 0.144, + "output": 1.434 }, "type": "chat" }, { - "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24B Instruct 2506", - "display_name": "Mistral Small 3.2 24B Instruct 2506", + "id": "kimi-k2-thinking", + "name": "Moonshot Kimi K2 Thinking", + "display_name": "Moonshot Kimi K2 
Thinking", "modalities": { "input": [ "text" @@ -147637,8 +155975,8 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -147646,24 +155984,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.33, - "output": 0.33 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "mistralai/Mistral-Medium-3.5-128B", - "name": "Mistral Medium 3.5 128B", - "display_name": "Mistral Medium 3.5 128B", + "id": "deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "display_name": "DeepSeek R1 Distill Qwen 14B", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -147671,8 +156018,8 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -147680,21 +156027,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2026-04", - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "attachment": false, + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.65, - "output": 5.5 + "input": 0.144, + "output": 0.431 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "qwen-deep-research", + "name": "Qwen Deep Research", + "display_name": "Qwen Deep Research", "modalities": { "input": [ "text" @@ -147704,30 +156050,29 @@ ] }, "limit": { - "context": 128000, - "output": 
8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-27", - "last_updated": "2025-04-27", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.99, - "output": 0.99 + "input": 7.742, + "output": 23.367 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "qwen-mt-plus", + "name": "Qwen Mt Plus", + "display_name": "Qwen Mt Plus", "modalities": { "input": [ "text" @@ -147737,10 +156082,42 @@ ] }, "limit": { - "context": 128000, + "context": 16384, "output": 8192 }, "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", + "cost": { + "input": 0.259, + "output": 0.775 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -147748,113 +156125,112 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.44, - "output": 0.99 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 
31B Instruct", - "display_name": "Gemma 4 31B Instruct", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ - "audio", - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", "cost": { - "input": 0.275, - "output": 0.55 + "input": 0.115, + "output": 0.287 }, "type": "chat" - } - ] - }, - "github-models": { - "id": "github-models", - "name": "GitHub Models", - "display_name": "GitHub Models", - "api": "https://models.github.ai/inference", - "doc": "https://docs.github.com/en/github-models", - "models": [ + }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", "cost": { - "input": 0, - "output": 0 + "input": 0.058, + "output": 0.23, + "input_audio": 3.584, + "output_audio": 7.168 }, "type": "chat" }, { - "id": 
"deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "display_name": "Qwen3-VL 30B-A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -147875,19 +156251,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.108, + "output": 0.431, + "reasoning": 1.076 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -147897,8 +156274,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -147908,30 +156285,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "ai21-labs/ai21-jamba-1.5-mini", - "name": "AI21 Jamba 1.5 Mini", - "display_name": "AI21 Jamba 1.5 Mini", + "id": "deepseek-v3-1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -147941,41 
+156311,41 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "ai21-labs/ai21-jamba-1.5-large", - "name": "AI21 Jamba 1.5 Large", - "display_name": "AI21 Jamba 1.5 Large", + "id": "qwen3.5-flash", + "name": "Qwen3.5 Flash", + "display_name": "Qwen3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -147983,54 +156353,66 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "knowledge": "2025-04", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0, - "output": 0 + "input": 0.172, + "output": 1.72, + "reasoning": 1.72 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-mini-instruct", - "name": "Phi-3.5-mini instruct (128k)", - "display_name": "Phi-3.5-mini instruct (128k)", + "id": "qwen-vl-ocr", + "name": "Qwen Vl Ocr", + "display_name": "Qwen Vl Ocr", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 34096, "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": 
false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", "cost": { - "input": 0, - "output": 0 + "input": 0.717, + "output": 0.717 }, "type": "chat" }, { - "id": "microsoft/phi-3-medium-4k-instruct", - "name": "Phi-3-medium instruct (4k)", - "display_name": "Phi-3-medium instruct (4k)", + "id": "qwen-long", + "name": "Qwen Long", + "display_name": "Qwen Long", "modalities": { "input": [ "text" @@ -148040,30 +156422,29 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 1000000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0, - "output": 0 + "input": 0.072, + "output": 0.287 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE instruct (128k)", - "display_name": "Phi-3.5-MoE instruct (128k)", + "id": "deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -148073,8 +156454,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -148083,31 +156464,34 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "release_date": "2025-01-01", + 
"last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "microsoft/phi-3-mini-128k-instruct", - "name": "Phi-3-mini instruct (128k)", - "display_name": "Phi-3-mini instruct (128k)", + "id": "qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "display_name": "Qwen3-Omni Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -148115,21 +156499,34 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0 + "input": 0.058, + "output": 0.23, + "input_audio": 3.584, + "output_audio": 7.168 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "display_name": "Qwen2.5 14B Instruct", "modalities": { "input": [ "text" @@ -148139,30 +156536,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 
0, - "output": 0 + "input": 0.144, + "output": 0.431 }, "type": "chat" }, { - "id": "microsoft/phi-4-reasoning", - "name": "Phi-4-Reasoning", - "display_name": "Phi-4-Reasoning", + "id": "qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -148172,30 +156568,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "microsoft/phi-3-small-8k-instruct", - "name": "Phi-3-small instruct (8k)", - "display_name": "Phi-3-small instruct (8k)", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ "text" @@ -148205,30 +156600,29 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.861, + "output": 3.441 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-vision-instruct", - "name": "Phi-3.5-vision instruct (128k)", - "display_name": "Phi-3.5-vision instruct (128k)", + "id": "qvq-max", + "name": "QVQ Max", + "display_name": "QVQ Max", "modalities": { "input": [ "text", @@ -148239,8 
+156633,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -148249,20 +156643,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0, - "output": 0 + "input": 1.147, + "output": 4.588 }, "type": "chat" }, { - "id": "microsoft/phi-3-mini-4k-instruct", - "name": "Phi-3-mini instruct (4k)", - "display_name": "Phi-3-mini instruct (4k)", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -148272,8 +156666,8 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 245800, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -148281,21 +156675,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2026-04-20", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0 + "input": 1.32, + "output": 7.9, + "cache_read": 0.132 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ "text" @@ -148305,30 +156710,66 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.216, + "output": 0.861 }, "type": "chat" }, { - "id": "microsoft/phi-3-small-128k-instruct", - "name": "Phi-3-small instruct (128k)", - "display_name": "Phi-3-small instruct (128k)", + "id": "qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "display_name": "Qwen3-Omni Flash Realtime", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 65536, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "cost": { + "input": 0.23, + "output": 0.918, + "input_audio": 3.584, + "output_audio": 7.168 + }, + "type": "chat" + }, + { + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -148338,30 +156779,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0, - "output": 0 + "input": 0.144, + "output": 0.574 }, "type": "chat" }, { - "id": "microsoft/phi-3-medium-128k-instruct", - "name": "Phi-3-medium instruct (128k)", - 
"display_name": "Phi-3-medium instruct (128k)", + "id": "deepseek-r1-distill-qwen-7b", + "name": "DeepSeek R1 Distill Qwen 7B", + "display_name": "DeepSeek R1 Distill Qwen 7B", "modalities": { "input": [ "text" @@ -148371,8 +156811,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -148381,88 +156821,89 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.072, + "output": 0.144 }, "type": "chat" }, { - "id": "microsoft/phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 0, - "output": 0 + "input": 0.23, + "output": 0.574 }, "type": "chat" }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Phi-4-multimodal-instruct", - "display_name": "Phi-4-multimodal-instruct", + "id": "qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "display_name": "Qwen2.5-Omni 7B", "modalities": { "input": [ "text", "image", - "audio" + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 2048 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0, - "output": 0 + "input": 0.087, + "output": 0.345, + "input_audio": 5.448 }, "type": "chat" }, { - "id": "microsoft/mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ "text" @@ -148472,30 +156913,53 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0, - "output": 0 + "input": 0.115, + "output": 0.287, + "reasoning": 1.147 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-08-2024", - "name": "Cohere Command R 08-2024", - "display_name": "Cohere Command R 08-2024", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -148505,40 +156969,53 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": 
false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0, - "output": 0 + "input": 0.86, + "output": 3.15 }, "type": "chat" }, { - "id": "cohere/cohere-command-a", - "name": "Cohere Command A", - "display_name": "Cohere Command A", + "id": "kimi-k2.6", + "name": "Moonshot Kimi K2.6", + "display_name": "Moonshot Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -148546,21 +157023,32 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0 + "input": 0.929, + "output": 3.858 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-plus", - "name": "Cohere Command R+", - "display_name": "Cohere Command R+", + "id": "qwen2-5-coder-7b-instruct", + "name": "Qwen2.5-Coder 7B Instruct", + "display_name": "Qwen2.5-Coder 7B Instruct", "modalities": { "input": [ "text" @@ -148570,8 +157058,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": 
true, @@ -148579,20 +157067,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-04-04", - "last_updated": "2024-08-01", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "cost": { - "input": 0, - "output": 0 + "input": 0.144, + "output": 0.287 }, "type": "chat" }, { - "id": "cohere/cohere-command-r", - "name": "Cohere Command R", - "display_name": "Cohere Command R", + "id": "qwen3-14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ "text" @@ -148602,30 +157090,47 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-11", - "last_updated": "2024-08-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.144, + "output": 0.574, + "reasoning": 1.434 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-plus-08-2024", - "name": "Cohere Command R+ 08-2024", - "display_name": "Cohere Command R+ 08-2024", + "id": "deepseek-v3-2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -148635,8 +157140,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -148645,19 +157150,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - 
"release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.287, + "output": 0.431 }, "type": "chat" }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -148667,63 +157171,76 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "kimi/kimi-k2.5", + "name": "kimi/kimi-k2.5", + "display_name": "kimi/kimi-k2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3, + 
"cache_read": 0.1 }, "type": "chat" }, { - "id": "openai/o1-mini", - "name": "OpenAI o1-mini", - "display_name": "OpenAI o1-mini", + "id": "siliconflow/deepseek-r1-0528", + "name": "siliconflow/deepseek-r1-0528", + "display_name": "siliconflow/deepseek-r1-0528", "modalities": { "input": [ "text" @@ -148733,11 +157250,11 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 163840, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -148745,114 +157262,96 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "siliconflow/deepseek-v3-0324", + "name": "siliconflow/deepseek-v3-0324", + "display_name": "siliconflow/deepseek-v3-0324", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 1 }, "type": 
"chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI o4-mini", - "display_name": "OpenAI o4-mini", + "id": "siliconflow/deepseek-v3.2", + "name": "siliconflow/deepseek-v3.2", + "display_name": "siliconflow/deepseek-v3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163840, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": "openai/o1-preview", - "name": "OpenAI o1-preview", - "display_name": "OpenAI o1-preview", + "id": "siliconflow/deepseek-v3.1-terminus", + "name": "siliconflow/deepseek-v3.1-terminus", + "display_name": "siliconflow/deepseek-v3.1-terminus", "modalities": { "input": [ "text" @@ -148862,59 +157361,43 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 163840, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "release_date": 
"2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "OpenAI o1", + "id": "MiniMax/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -148922,32 +157405,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "OpenAI o3-mini", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -148957,11 +157438,11 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 384000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -148969,80 +157450,44 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - 
"effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 100000 - }, - "temperature": false, - "tool_call": false, "reasoning": { "supported": true, "default": true @@ -149050,99 +157495,78 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": 
"2025-01-31", - "last_updated": "2025-01-31", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "qwen3-coder-plus-2025-09-23", + "name": "Qwen3 Coder Plus 2025 09 23", + "display_name": "Qwen3 Coder Plus 2025 09 23", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "qwen3-coder-plus-2025-07-22", + "name": "Qwen3 Coder Plus 2025 07 22", + "display_name": "Qwen3 Coder Plus 2025 07 22", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "qwen-vl-ocr-latest", + "name": "Qwen Vl Ocr Latest", + "display_name": "Qwen Vl Ocr Latest", "modalities": { "input": [ "text", @@ -149153,29 +157577,21 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 34096, + "output": 4096 
}, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, "type": "chat" }, { - "id": "meta/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "qvq-max-2025-05-15", + "name": "Qvq Max 2025 05 15", + "display_name": "Qvq Max 2025 05 15", "modalities": { "input": [ "text", @@ -149186,30 +157602,27 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 16384, + "min": 0, + "max": 16384 + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "qwen-turbo-latest", + "name": "Qwen Turbo Latest", + "display_name": "Qwen Turbo Latest", "modalities": { "input": [ "text" @@ -149219,30 +157632,44 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + 
"continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "qwen-turbo-2024-09-19", + "name": "Qwen Turbo 2024 09 19", + "display_name": "Qwen Turbo 2024 09 19", "modalities": { "input": [ "text" @@ -149252,30 +157679,21 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "qwen-flash-2025-07-28", + "name": "Qwen Flash 2025 07 28", + "display_name": "Qwen Flash 2025 07 28", "modalities": { "input": [ "text" @@ -149285,100 +157703,115 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": 
"chat" }, { - "id": "meta/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "qwen-plus-2024-09-19", + "name": "Qwen Plus 2024 09 19", + "display_name": "Qwen Plus 2024 09 19", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": 
"Meta-Llama-3.1-405B-Instruct", + "id": "qwen-plus-2025-07-14", + "name": "Qwen Plus 2025 07 14", + "display_name": "Qwen Plus 2025 07 14", "modalities": { "input": [ "text" @@ -149388,30 +157821,44 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta/meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "qwen-plus-2025-09-11", + "name": "Qwen Plus 2025 09 11", + "display_name": "Qwen Plus 2025 09 11", "modalities": { "input": [ "text" @@ -149421,97 +157868,74 @@ ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "meta/meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "limit": { - "context": 
8192, - "output": 2048 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "temperature": true, - "tool_call": true, - "reasoning": { + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "core42/jais-30b-chat", - "name": "JAIS 30b Chat", - "display_name": "JAIS 30b Chat", + "id": "qwen-max-2024-09-19", + "name": "Qwen Max 2024 09 19", + "display_name": "Qwen Max 2024 09 19", "modalities": { "input": [ "text" @@ -149521,30 +157945,27 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2023-08-30", 
- "last_updated": "2023-08-30", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "mistral-ai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "qwen-max-2024-04-28", + "name": "Qwen Max 2024 04 28", + "display_name": "Qwen Max 2024 04 28", "modalities": { "input": [ "text" @@ -149554,30 +157975,21 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "mistral-ai/ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "qwen-max-2024-04-03", + "name": "Qwen Max 2024 04 03", + "display_name": "Qwen Max 2024 04 03", "modalities": { "input": [ "text" @@ -149587,30 +157999,21 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "mistral-ai/mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "qwen-max-2025-01-25", + "name": "Qwen Max 2025 01 25", + "display_name": "Qwen Max 2025 01 25", "modalities": { "input": [ "text" @@ -149620,98 +158023,98 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, 
"reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "mistral-ai/mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "qwen3-max-2025-09-23", + "name": "Qwen3 Max 20250923", + "display_name": "Qwen3 Max 20250923", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "mistral-ai/mistral-medium-2505", - "name": "Mistral Medium 3 (25.05)", - "display_name": "Mistral Medium 3 (25.05)", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - 
"open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "mistral-ai/codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -149721,39 +158124,38 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" - } - ] - }, - "neuralwatt": { - "id": "neuralwatt", - "name": "Neuralwatt", - "display_name": "Neuralwatt", - "api": "https://api.neuralwatt.com/v1", - "doc": "https://portal.neuralwatt.com/docs", - "models": [ + }, { - "id": "glm-5-fast", - "name": "GLM 5 Fast", - "display_name": "GLM 5 Fast", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -149763,8 +158165,8 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -149772,51 +158174,36 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", - "cost": { - "input": 1.1, - 
"output": 3.6 - }, "type": "chat" }, { - "id": "kimi-k2.6-fast", - "name": "Kimi K2.6 Fast", - "display_name": "Kimi K2.6 Fast", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0.69, - "output": 3.22 - }, + "attachment": false, "type": "chat" }, { - "id": "qwen3.5-397b-fast", - "name": "Qwen3.5 397B Fast", - "display_name": "Qwen3.5 397B Fast", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -149826,13 +158213,19 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -149846,19 +158239,12 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", - "cost": { - "input": 0.69, - "output": 4.14 - }, "type": "chat" }, { - "id": "glm-5.1-fast", - "name": "GLM 5.1 Fast", - "display_name": "GLM 5.1 Fast", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -149868,32 +158254,41 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + 
"default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", - "cost": { - "input": 1.1, - "output": 3.6 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "qwen3.6-35b-fast", - "name": "Qwen3.6 35B Fast", - "display_name": "Qwen3.6 35B Fast", + "id": "qwen3-4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -149901,12 +158296,18 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { @@ -149919,52 +158320,54 @@ ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", - "cost": { - "input": 0.05, - "output": 0.1 - }, + "attachment": false, "type": "chat" }, { - "id": "kimi-k2.5-fast", - "name": "Kimi K2.5 Fast", - "display_name": "Kimi K2.5 Fast", + "id": "qwen3-1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 1.7B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", - "cost": { - "input": 0.52, - "output": 2.59 + "extra_capabilities": { + "reasoning": 
{ + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B-FP8", - "name": "Qwen3.5 397B A17B FP8", - "display_name": "Qwen3.5 397B A17B FP8", + "id": "qwen3-0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", "modalities": { "input": [ "text" @@ -149974,14 +158377,19 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, "extra_capabilities": { "reasoning": { @@ -149995,19 +158403,12 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", - "cost": { - "input": 0.69, - "output": 4.14 - }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "qwen3-vl-plus-2025-09-23", + "name": "Qwen3 VL Plus 2025 09 23", + "display_name": "Qwen3 VL Plus 2025 09 23", "modalities": { "input": [ "text", @@ -150018,14 +158419,19 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -150038,20 +158444,13 @@ ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", - "cost": { - "input": 0.05, - "output": 0.1 - }, + "attachment": false, "type": "chat" }, { - "id": "zai-org/GLM-5.1-FP8", - "name": "GLM 5.1 FP8", - "display_name": "GLM 5.1 FP8", + "id": "qwq-plus-latest", + "name": "QwQ Plus Latest", + "display_name": "QwQ 
Plus Latest", "modalities": { "input": [ "text" @@ -150061,14 +158460,19 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } }, "extra_capabilities": { "reasoning": { @@ -150081,52 +158485,69 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", - "cost": { - "input": 1.1, - "output": 3.6 + "search": { + "supported": false }, + "attachment": false, "type": "chat" - }, + } + ] + }, + "drun": { + "id": "drun", + "name": "D.Run (China)", + "display_name": "D.Run (China)", + "api": "https://chat.d.run/v1", + "doc": "https://www.d.run", + "models": [ { - "id": "mistralai/Devstral-Small-2-24B-Instruct-2512", - "name": "Devstral Small 2 24B Instruct 2512", - "display_name": "Devstral Small 2 24B Instruct 2512", + "id": "public/deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.12, - "output": 0.35 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT 
OSS 20B", + "id": "public/deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -150136,46 +158557,40 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 0.03, - "output": 0.16 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "public/minimax-m25", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -150194,32 +158609,40 @@ ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.69, - "output": 3.22 + "input": 0.29, + "output": 1.16 }, "type": "chat" - }, + } + ] + }, + "huggingface": { + "id": "huggingface", + "name": "Hugging Face", + "display_name": "Hugging Face", + "api": "https://router.huggingface.co/v1", + "doc": "https://huggingface.co/docs/inference-providers", + "models": [ { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ 
"text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -150238,20 +158661,21 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.52, - "output": 2.59 + "input": 3, + "output": 5 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -150261,8 +158685,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -150272,37 +158696,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.35, - "output": 1.38 + "input": 0.28, + "output": 0.4 }, "type": "chat" - } - ] - }, - "togetherai": { - "id": "togetherai", - "name": "Together AI", - "display_name": "Together AI", - "doc": "https://docs.together.ai/docs/serverless-models", - "models": [ + }, { - "id": "essentialai/Rnj-1-Instruct", - "name": "Rnj-1 Instruct", - "display_name": "Rnj-1 Instruct", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi-K2-Instruct", + "display_name": "Kimi-K2-Instruct", "modalities": { "input": [ "text" @@ -150312,8 +158723,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 16384 }, "temperature": true, 
"tool_call": true, @@ -150323,22 +158734,21 @@ "attachment": false, "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-12-05", - "last_updated": "2025-12-05", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.15, - "output": 0.15 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi-K2-Thinking", + "display_name": "Kimi-K2-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -150346,7 +158756,7 @@ }, "limit": { "context": 262144, - "output": 130000 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -150367,29 +158777,33 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { "input": 0.6, - "output": 3.6 + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-Plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 500000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -150408,23 +158822,27 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "knowledge": "2025-01", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.5, - "output": 3 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next-FP8", - "name": "Qwen3 Coder Next FP8", - "display_name": "Qwen3 Coder Next FP8", + "id": 
"moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -150440,21 +158858,33 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2026-02-03", - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "knowledge": "2025-01", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.5, - "output": 1.2 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput", - "name": "Qwen3 235B A22B Instruct 2507 FP8", - "display_name": "Qwen3 235B A22B Instruct 2507 FP8", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi-K2-Instruct-0905", + "display_name": "Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -150465,29 +158895,28 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "knowledge": "2024-10", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 0.2, - "output": 0.6 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -150497,29 +158926,42 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + 
"output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 2, - "output": 2 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -150529,8 +158971,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -150540,24 +158982,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "knowledge": "2025-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1.4, - "output": 4.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -150567,29 +159015,41 @@ ] }, "limit": { - "context": 131072, + "context": 202752, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.88, - "output": 0.88 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -150599,7 +159059,7 @@ ] }, "limit": { - "context": 131072, + "context": 202752, "output": 131072 }, "temperature": true, @@ -150608,21 +159068,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "release_date": "2026-04-03", + "last_updated": "2026-04-03", "cost": { - "input": 1.25, - "output": 1.25 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -150632,41 +159103,30 @@ ] }, "limit": { - "context": 163839, - "output": 163839 + "context": 262144, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", 
- "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-03-24", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 3, - "output": 7 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -150676,7 +159136,7 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, @@ -150685,21 +159145,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2025-10", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.6, - "output": 1.7 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "MiniMaxAI/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -150709,8 +159180,8 @@ ] }, "limit": { - "context": 512000, - "output": 384000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -150731,19 +159202,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2.1, - "output": 4.4, - "cache_read": 0.2 + "input": 0.3, + "output": 1.2, + 
"cache_read": 0.06 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -150753,7 +159224,7 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, @@ -150764,28 +159235,33 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 31B Instruct", - "display_name": "Gemma 4 31B Instruct", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -150801,26 +159277,35 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.3, + "output": 3 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": 
"Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -150828,39 +159313,31 @@ }, "limit": { "context": 262144, - "output": 131000 + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 1.2, - "output": 4.5, - "cache_read": 0.2 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -150868,13 +159345,12 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -150889,30 +159365,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 0.5, - "output": 2.8 + "input": 0.3, + "output": 2 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ 
"text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -150922,24 +159399,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-04", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "Qwen/Qwen3-Embedding-4B", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", "modalities": { "input": [ "text" @@ -150949,213 +159432,136 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 32000, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.01, + "output": 0 }, - "type": "chat" - } - ] - }, - "qihang-ai": { - "id": "qihang-ai", - "name": "QiHang", - "display_name": "QiHang", - "api": "https://api.qhaigc.net/v1", - "doc": "https://www.qhaigc.net/docs", - "models": [ + "type": "embedding" + }, { - "id": 
"claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "Qwen/Qwen3-Coder-Next", + "name": "Qwen3-Coder-Next", + "display_name": "Qwen3-Coder-Next", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 0.71, - "output": 3.57 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + 
"last_updated": "2025-07-23", "cost": { - "input": 0.07, - "output": 0.43, - "context_over_200k": { - "input": 0.07, - "output": 0.43 - } + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5-Mini", - "display_name": "GPT-5-Mini", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen 3 Embedding 8B", + "display_name": "Qwen 3 Embedding 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.04, - "output": 0.29 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -151166,126 +159572,119 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": 
true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.57, - "output": 3.43 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" - }, + } + ] + }, + "umans-ai-coding-plan": { + "id": "umans-ai-coding-plan", + "name": "Umans AI Coding Plan", + "display_name": "Umans AI Coding Plan", + "api": "https://api.code.umans.ai/v1", + "doc": "https://app.umans.ai/offers/code/docs", + "models": [ { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "umans-qwen3.6-35b-a3b", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.43, - "output": 2.14 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "umans-glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
400000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.25, - "output": 2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "umans-coder", + "name": "Umans Coder", + "display_name": "Umans Coder", "modalities": { "input": [ "text", @@ -151296,8 +159695,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": false, "tool_call": true, @@ -151308,128 +159707,106 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "knowledge": "2025-01", + 
"release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.14, - "output": 1.14 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "umans-flash", + "name": "Umans Flash", + "display_name": "Umans Flash", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.09, - "output": 0.71, - "context_over_200k": { - "input": 0.09, - "output": 0.71 - } + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "umans-kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + 
"interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.14, - "output": 0.71 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" } @@ -151478,16 +159855,16 @@ } ] }, - "anthropic": { - "id": "anthropic", - "name": "Anthropic", - "display_name": "Anthropic", - "doc": "https://docs.anthropic.com/en/docs/about-claude/models", + "gitlab": { + "id": "gitlab", + "name": "GitLab Duo", + "display_name": "GitLab Duo", + "doc": "https://docs.gitlab.com/user/duo_agent_platform/", "models": [ { - "id": "claude-3-sonnet-20240229", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "duo-chat-gpt-5-2-codex", + "name": "Agentic Chat (GPT-5.2 Codex)", + "display_name": "Agentic Chat (GPT-5.2 Codex)", "modalities": { "input": [ "text", @@ -151499,31 +159876,30 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "knowledge": "2025-08-31", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "duo-chat-haiku-4-5", + "name": "Agentic Chat (Claude Haiku 4.5)", + "display_name": "Agentic Chat (Claude Haiku 4.5)", 
"modalities": { "input": [ "text", @@ -151544,28 +159920,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "duo-chat-opus-4-6", + "name": "Agentic Chat (Claude Opus 4.6)", + "display_name": "Agentic Chat (Claude Opus 4.6)", "modalities": { "input": [ "text", @@ -151577,7 +159948,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -151588,57 +159959,55 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-3-opus-20240229", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "duo-chat-gpt-5-2", + "name": "Agentic Chat (GPT-5.2)", + "display_name": "Agentic Chat (GPT-5.2)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - 
"last_updated": "2024-02-29", + "knowledge": "2025-08-31", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "duo-chat-gpt-5-3-codex", + "name": "Agentic Chat (GPT-5.3 Codex)", + "display_name": "Agentic Chat (GPT-5.3 Codex)", "modalities": { "input": [ "text", @@ -151650,31 +160019,64 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "duo-chat-gpt-5-1", + "name": "Agentic Chat (GPT-5.1)", + "display_name": "Agentic Chat (GPT-5.1)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "duo-chat-opus-4-5", + "name": "Agentic Chat (Claude Opus 4.5)", + "display_name": "Agentic Chat (Claude Opus 4.5)", "modalities": { "input": [ 
"text", @@ -151687,30 +160089,31 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-03-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "duo-chat-opus-4-7", + "name": "Agentic Chat (Claude Opus 4.7)", + "display_name": "Agentic Chat (Claude Opus 4.7)", "modalities": { "input": [ "text", @@ -151725,55 +160128,29 @@ "context": 1000000, "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-opus-4-0", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "duo-chat-sonnet-4-5", + "name": "Agentic Chat (Claude Sonnet 4.5)", + "display_name": "Agentic Chat (Claude Sonnet 4.5)", "modalities": { "input": [ "text", @@ -151786,7 +160163,7 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -151796,133 +160173,103 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-07-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "duo-chat-gpt-5-4-nano", + "name": "Agentic Chat (GPT-5.4 Nano)", + "display_name": "Agentic Chat (GPT-5.4 Nano)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": 
true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-haiku-20240307", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "duo-chat-gpt-5-codex", + "name": "Agentic Chat (GPT-5 Codex)", + "display_name": "Agentic Chat (GPT-5 Codex)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "duo-chat-gpt-5-4-mini", + "name": "Agentic Chat (GPT-5.4 Mini)", + "display_name": "Agentic Chat (GPT-5.4 Mini)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 
200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -151930,57 +160277,53 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-5-haiku-latest", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "duo-chat-gpt-5-mini", + "name": "Agentic Chat (GPT-5 Mini)", + "display_name": "Agentic Chat (GPT-5 Mini)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-05-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "duo-chat-sonnet-4-6", + "name": "Agentic Chat (Claude Sonnet 4.6)", + "display_name": "Agentic Chat (Claude Sonnet 4.6)", "modalities": { "input": [ "text", @@ -151992,8 +160335,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -152001,28 +160344,23 @@ "supported": true, "default": true }, - 
"extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-0", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "duo-chat-gpt-5-5", + "name": "Agentic Chat (GPT-5.5)", + "display_name": "Agentic Chat (GPT-5.5)", "modalities": { "input": [ "text", @@ -152034,37 +160372,30 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-08-31", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20240620", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "duo-chat-gpt-5-4", + "name": "Agentic Chat (GPT-5.4)", + "display_name": "Agentic Chat (GPT-5.4)", "modalities": { "input": [ "text", @@ -152076,44 +160407,85 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": 
"2024-04-30", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + } + ] + }, + "nebius": { + "id": "nebius", + "name": "Nebius Token Factory", + "display_name": "Nebius Token Factory", + "api": "https://api.tokenfactory.nebius.com/v1", + "doc": "https://docs.tokenfactory.nebius.com/", + "models": [ + { + "id": "deepseek-ai/DeepSeek-V3.2-fast", + "name": "DeepSeek-V3.2-fast", + "display_name": "DeepSeek-V3.2-fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2026-05-07", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.4, + "output": 2, + "cache_read": 0.04, + "cache_write": 0.5 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -152123,39 +160495,45 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + 
"knowledge": "2025-11", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 0.45, + "reasoning": 0.45, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "moonshotai/Kimi-K2.5-fast", + "name": "Kimi-K2.5-fast", + "display_name": "Kimi-K2.5-fast", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152163,36 +160541,46 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-15", + "last_updated": "2026-02-04", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.5, + "output": 2.5, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152200,36 +160588,46 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-15", + "last_updated": "2026-02-04", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.5, + "output": 2.5, + "reasoning": 2.5, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "openai/gpt-oss-120b-fast", + "name": "gpt-oss-120b-fast", + "display_name": "gpt-oss-120b-fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152237,91 +160635,73 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-06-10", + "last_updated": "2026-05-07", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.1, + "output": 0.5, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "openai/gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { 
"reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.15, + "output": 0.6, + "reasoning": 0.6, + "cache_read": 0.015, + "cache_write": 0.18 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -152329,64 +160709,53 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + 
"knowledge": "2026-01", + "release_date": "2026-03-01", + "last_updated": "2026-03-10", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1, + "output": 3.2, + "cache_read": 0.1, + "cache_write": 1 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "NousResearch/Hermes-4-405B", + "name": "Hermes-4-405B", + "display_name": "Hermes-4-405B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152396,39 +160765,44 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1, + "output": 3, + "reasoning": 3, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "NousResearch/Hermes-4-70B", + "name": "Hermes-4-70B", + "display_name": "Hermes-4-70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152436,32 +160810,35 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", 
- "last_updated": "2025-05-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.13, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 }, "type": "chat" - } - ] - }, - "modelscope": { - "id": "modelscope", - "name": "ModelScope", - "display_name": "ModelScope", - "api": "https://api-inference.modelscope.cn/v1", - "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", - "models": [ + }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "nvidia/Nemotron-3-Nano-Omni", + "name": "Nemotron-3-Nano-Omni", + "display_name": "Nemotron-3-Nano-Omni", "modalities": { "input": [ "text" @@ -152471,8 +160848,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152480,32 +160857,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.06, + "output": 0.24, + "cache_read": 0.006, + "cache_write": 0.075 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B 
Instruct 2507", + "id": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B", + "name": "Nemotron-3-Nano-30B-A3B", + "display_name": "Nemotron-3-Nano-30B-A3B", "modalities": { "input": [ "text" @@ -152515,8 +160883,8 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 32000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -152525,19 +160893,21 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2025-05", + "release_date": "2025-08-10", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.06, + "output": 0.24, + "cache_read": 0.006, + "cache_write": 0.075 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron-3-Super-120B-A12B", + "display_name": "Nemotron-3-Super-120B-A12B", "modalities": { "input": [ "text" @@ -152547,29 +160917,30 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", + "name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", "modalities": { "input": [ "text" @@ -152579,8 +160950,8 @@ ] }, "limit": { - "context": 262144, - 
"output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -152589,63 +160960,56 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 1.8, + "cache_read": 0.06, + "cache_write": 0.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "google/gemma-3-27b-it", + "name": "Gemma-3-27b-it", + "display_name": "Gemma-3-27b-it", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 110000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "knowledge": "2025-10", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "ZhipuAI/GLM-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "google/gemma-2-2b-it", + "name": "Gemma-2-2b-it", + "display_name": "Gemma-2-2b-it", "modalities": { "input": [ "text" @@ -152655,30 +161019,31 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 8192, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { 
- "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-06", + "release_date": "2024-07-31", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 }, "type": "chat" }, { - "id": "ZhipuAI/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -152688,44 +161053,31 @@ ] }, "limit": { - "context": 202752, - "output": 98304 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-12", + "release_date": "2024-07-23", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 }, "type": "chat" - } - ] - }, - "hpc-ai": { - "id": "hpc-ai", - "name": "HPC-AI", - "display_name": "HPC-AI", - "api": "https://api.hpc-ai.com/inference/v1", - "doc": "https://www.hpc-ai.com/doc/docs/quickstart/", - "models": [ + }, { - "id": "zai-org/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -152735,41 +161087,31 @@ ] }, "limit": { - "context": 202000, - "output": 202000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": 
true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "knowledge": "2025-08", + "release_date": "2025-12-05", + "last_updated": "2026-02-04", "cost": { - "input": 0.66, - "output": 2, - "cache_read": 0.12 + "input": 0.13, + "output": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "MiniMaxAI/MiniMax-M2.5-fast", + "name": "MiniMax-M2.5-fast", + "display_name": "MiniMax-M2.5-fast", "modalities": { "input": [ "text" @@ -152779,8 +161121,8 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152788,41 +161130,36 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-25", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", "cost": { - "input": 0.14, - "output": 0.56, - "cache_read": 0.014 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 196608, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -152830,178 +161167,186 @@ }, 
"extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01-01", - "release_date": "2026-01-01", - "last_updated": "2026-03-25", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", "cost": { - "input": 0.21, - "output": 1, - "cache_read": 0.03 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" - } - ] - }, - "gitlab": { - "id": "gitlab", - "name": "GitLab Duo", - "display_name": "GitLab Duo", - "doc": "https://docs.gitlab.com/user/duo_agent_platform/", - "models": [ + }, { - "id": "duo-chat-gpt-5-4-nano", - "name": "Agentic Chat (GPT-5.4 Nano)", - "display_name": "Agentic Chat (GPT-5.4 Nano)", + "id": "PrimeIntellect/INTELLECT-3", + "name": "INTELLECT-3", + "display_name": "INTELLECT-3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-25", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 1.1, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-mini", - "name": "Agentic Chat (GPT-5 Mini)", - "display_name": "Agentic Chat (GPT-5 Mini)", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ 
- "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 1.2, + "reasoning": 1.2, + "cache_read": 0.015, + "cache_write": 0.18 }, "type": "chat" }, { - "id": "duo-chat-sonnet-4-6", - "name": "Agentic Chat (Claude Sonnet 4.6)", - "display_name": "Agentic Chat (Claude Sonnet 4.6)", + "id": "Qwen/Qwen3-32B", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 
0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-2", - "name": "Agentic Chat (GPT-5.2)", - "display_name": "Agentic Chat (GPT-5.2)", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-codex", - "name": "Agentic Chat (GPT-5 Codex)", - "display_name": "Agentic Chat (GPT-5 Codex)", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", @@ -153012,112 +161357,121 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025, + "cache_write": 0.31 }, "type": "chat" }, { - 
"id": "duo-chat-gpt-5-1", - "name": "Agentic Chat (GPT-5.1)", - "display_name": "Agentic Chat (GPT-5.1)", + "id": "Qwen/Qwen3.5-397B-A17B-fast", + "name": "Qwen3.5-397B-A17B-fast", + "display_name": "Qwen3.5-397B-A17B-fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-15", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3.6, + "cache_read": 0.06, + "cache_write": 0.75 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-2-codex", - "name": "Agentic Chat (GPT-5.2 Codex)", - "display_name": "Agentic Chat (GPT-5.2 Codex)", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-10-04", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + 
"output": 0.6 }, "type": "chat" }, { - "id": "duo-chat-sonnet-4-5", - "name": "Agentic Chat (Claude Sonnet 4.5)", - "display_name": "Agentic Chat (Claude Sonnet 4.5)", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking-fast", + "name": "Qwen3-Next-80B-A3B-Thinking-fast", + "display_name": "Qwen3-Next-80B-A3B-Thinking-fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -153125,71 +161479,91 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2026-01-08", - "last_updated": "2026-01-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 1.2, + "cache_read": 0.015, + "cache_write": 0.1875 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-4", - "name": "Agentic Chat (GPT-5.4)", - "display_name": "Agentic Chat (GPT-5.4)", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + 
"summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-15", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3.6, + "cache_read": 0.06, + "cache_write": 0.75 }, "type": "chat" }, { - "id": "duo-chat-haiku-4-5", - "name": "Agentic Chat (Claude Haiku 4.5)", - "display_name": "Agentic Chat (Claude Haiku 4.5)", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507-fast", + "name": "Qwen3-235B-A22B-Thinking-2507-fast", + "display_name": "Qwen3-235B-A22B-Thinking-2507-fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -153197,105 +161571,133 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2026-01-08", - "last_updated": "2026-01-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.5, + "output": 2, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-3-codex", - "name": "Agentic Chat (GPT-5.3 Codex)", - "display_name": "Agentic Chat (GPT-5.3 Codex)", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen3-Embedding-8B", + "display_name": "Qwen3-Embedding-8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 8192 
}, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", "cost": { - "input": 0, + "input": 0.01, "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "duo-chat-gpt-5-4-mini", - "name": "Agentic Chat (GPT-5.4 Mini)", - "display_name": "Agentic Chat (GPT-5.4 Mini)", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 3.5, + "cache_read": 0.15 }, "type": "chat" - }, + } + ] + }, + "hpc-ai": { + "id": "hpc-ai", + "name": "HPC-AI", + "display_name": "HPC-AI", + "api": "https://api.hpc-ai.com/inference/v1", + "doc": "https://www.hpc-ai.com/doc/docs/quickstart/", + "models": [ { - "id": "duo-chat-opus-4-7", - "name": "Agentic Chat (Claude Opus 4.7)", - "display_name": "Agentic Chat (Claude Opus 4.7)", + "id": "moonshotai/kimi-k2.5", 
+ "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": false, "tool_call": true, @@ -153303,36 +161705,44 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01-01", + "release_date": "2026-01-01", + "last_updated": "2026-03-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.21, + "output": 1, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "duo-chat-opus-4-5", - "name": "Agentic Chat (Claude Opus 4.5)", - "display_name": "Agentic Chat (Claude Opus 4.5)", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 202000, + "output": 202000 }, "temperature": true, "tool_call": true, @@ -153340,28 +161750,35 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2026-01-08", - "last_updated": "2026-01-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.66, + 
"output": 2, + "cache_read": 0.12 }, "type": "chat" }, { - "id": "duo-chat-opus-4-6", - "name": "Agentic Chat (Claude Opus 4.6)", - "display_name": "Agentic Chat (Claude Opus 4.6)", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -153369,7 +161786,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -153377,16 +161794,19 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-03-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.14, + "output": 0.56, + "cache_read": 0.014 }, "type": "chat" } @@ -153400,19 +161820,23 @@ "doc": "https://platform.xiaomimimo.com/#/docs", "models": [ { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 131072 }, "temperature": true, @@ -153432,41 +161856,32 @@ ] } }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": 
"chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 131072 }, "temperature": true, @@ -153486,36 +161901,49 @@ ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -153534,20 +161962,15 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, @@ -153593,6 +162016,17 @@ "input": 1, "output": 3, "cache_read": 0.2, + 
"tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], "context_over_200k": { "input": 2, "output": 6, @@ -153602,20 +162036,23 @@ "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -153634,64 +162071,81 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + } }, "type": "chat" } ] }, - "clarifai": { - "id": "clarifai", - "name": "Clarifai", - "display_name": "Clarifai", - "api": "https://api.clarifai.com/v2/ext/openai/v1", - "doc": "https://docs.clarifai.com/compute/inference/", + "github-copilot": { + "id": "github-copilot", + "name": "GitHub Copilot", + "display_name": "GitHub Copilot", + "api": "https://api.githubcopilot.com", + "doc": "https://docs.github.com/en/copilot", "models": [ { - "id": "arcee_ai/AFM/models/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "claude-opus-41", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - 
"output": 131072 + "context": 80000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-12", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.045, - "output": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/completion/models/Ministral-3-14B-Reasoning-2512", - "name": "Ministral 3 14B Reasoning 2512", - "display_name": "Ministral 3 14B Reasoning 2512", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", @@ -153702,30 +162156,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-12", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 2.5, - "output": 1.7 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/completion/models/Ministral-3-3B-Reasoning-2512", - "name": "Ministral 3 3B Reasoning 2512", - "display_name": "Ministral 3 3B Reasoning 2512", + "id": "claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", @@ -153736,29 +162189,56 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, 
+ "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-12", - "last_updated": "2026-02-25", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 1.039, - "output": 0.54825 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-ocr/models/DeepSeek-OCR", - "name": "DeepSeek OCR", - "display_name": "DeepSeek OCR", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -153769,39 +162249,64 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 264000, + "output": 64000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2026-02-25", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/chat-completion/models/gpt-oss-20b", - "name": "GPT OSS 
20B", - "display_name": "GPT OSS 20B", + "id": "claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 144000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -153809,36 +162314,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-12-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.045, - "output": 0.18 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/chat-completion/models/gpt-oss-120b-high-throughput", - "name": "GPT OSS 120B High Throughput", - "display_name": "GPT OSS 120B High Throughput", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -153846,52 +162350,95 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2026-02-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.09, - "output": 0.36 
+ "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimaxai/chat-completion/models/MiniMax-M2_5-high-throughput", - "name": "MiniMax-M2.5 High Throughput", - "display_name": "MiniMax-M2.5 High Throughput", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-mini", + "display_name": "GPT-5.1-Codex-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-25", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwenCoder/models/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -153901,148 +162448,142 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": 
"2026-02-12", + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-27", + "last_updated": "2025-08-27", "cost": { - "input": 0.11458, - "output": 0.74812 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 144000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-31", - "last_updated": "2026-02-25", - "cost": { - "input": 0.36, - "output": 1.3 - }, - "type": "chat" - }, - { - "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.3, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "clarifai/main/models/mm-poly-8b", - "name": "MM Poly 8B", - "display_name": "MM Poly 8B", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2026-02-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.658, - "output": 1.11 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/chat-completion/models/Kimi-K2_6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 
262144, - "output": 262144 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -154053,215 +162594,214 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, + "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0.95, - "output": 4 - }, - "type": "chat" - } - ] - }, - "minimax-cn": { - "id": "minimax-cn", - "name": "MiniMax (minimaxi.com)", - "display_name": "MiniMax (minimaxi.com)", - "api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/guides/quickstart", - "models": [ - { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 196608, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 264000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { 
"supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + 
"input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 144000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -154269,36 +162809,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": 
"2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -154308,100 +162845,152 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "regolo-ai": { - "id": "regolo-ai", - "name": "Regolo AI", - "display_name": "Regolo AI", - "api": "https://api.regolo.ai/v1", - "doc": "https://docs.regolo.ai/", - "models": [ + }, { - "id": "mistral-small3.2", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-max", + "display_name": "GPT-5.1-Codex-max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 120000 + "context": 400000, + "output": 128000 }, 
- "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2024-09-30", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 0.5, - "output": 2.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-embedding-8b", - "name": "Qwen3-Embedding-8B", - "display_name": "Qwen3-Embedding-8B", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0, + "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - 
"display_name": "Llama 3.3 70B Instruct", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" @@ -154409,58 +162998,82 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.6, - "output": 2.7 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-reranker-4b", - "name": "Qwen3-Reranker-4B", - "display_name": "Qwen3-Reranker-4B", + "id": "claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 160000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.12, - "output": 0.12 + "input": 0, + "output": 0 }, - "type": "rerank" + "type": "chat" }, { - "id": 
"mistral-small-4-119b", - "name": "Mistral Small 4 119B", - "display_name": "Mistral Small 4 119B", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", @@ -154471,8 +163084,8 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 216000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -154482,18 +163095,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.75, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.5-122b", - "name": "Qwen3.5-122B", - "display_name": "Qwen3.5-122B", + "id": "gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ "text", @@ -154504,113 +163118,117 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", - "cost": { - "input": 0.9, - "output": 3.6 - }, - "type": "chat" - }, - { - "id": "qwen-image", - "name": "Qwen-Image", - "display_name": "Qwen-Image", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 
4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, "attachment": false, "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.5, - "output": 2 + "input": 0, + "output": 0 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3-Coder-Next", - "display_name": "Qwen3-Coder-Next", + "id": "gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax 2.5", - "display_name": "MiniMax 2.5", + "id": "gpt-5-mini", + "name": "GPT-5-mini", + "display_name": "GPT-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 190000, + "context": 264000, "output": 64000 }, "temperature": true, @@ -154621,36 +163239,54 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + 
"default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-10", - "last_updated": "2026-03-10", + "knowledge": "2024-06", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": { - "input": 0.8, - "output": 3.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "GPT-OSS-20B", - "display_name": "GPT-OSS-20B", + "id": "gpt-5.3-codex", + "name": "GPT-5.3-Codex", + "display_name": "GPT-5.3-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -154658,23 +163294,40 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.4, - "output": 1.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.5-9b", - "name": "Qwen3.5-9B", - "display_name": "Qwen3.5-9B", + "id": "claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -154685,43 +163338,58 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 
144000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -154729,7 +163397,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -154739,93 +163407,92 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 1, - "output": 4.2 - }, - "type": "chat" - }, - { - "id": 
"llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 120000, - "output": 120000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-07", - "last_updated": "2025-04-07", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0, + "output": 0 }, "type": "chat" } ] }, - "xiaomi-token-plan-ams": { - "id": "xiaomi-token-plan-ams", - "name": "Xiaomi Token Plan (Europe)", - "display_name": "Xiaomi Token Plan (Europe)", - "api": "https://token-plan-ams.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", + "togetherai": { + "id": "togetherai", + "name": "Together AI", + "display_name": "Together AI", + "doc": "https://docs.together.ai/docs/serverless-models", "models": [ { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", + "id": "deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 163839, + "output": 163839 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-03-24", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 7 }, "type": "chat" 
}, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -154835,8 +163502,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 512000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -154857,20 +163524,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 2.1, + "output": 4.4, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "deepseek-ai/DeepSeek-V3-1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -154880,7 +163546,7 @@ ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 131072 }, "temperature": true, @@ -154889,51 +163555,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.6, + "output": 1.7 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ - "text", 
- "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 131072 }, "temperature": true, @@ -154942,45 +163588,26 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" @@ -154988,7 +163615,7 @@ }, "limit": { "context": 262144, - "output": 131072 + "output": 131000 }, "temperature": true, "tool_call": true, @@ -154998,42 +163625,37 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.2, + "output": 4.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": 
"moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -155054,47 +163676,29 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 0.5, + "output": 2.8 }, "type": "chat" - } - ] - }, - "zhipuai": { - "id": "zhipuai", - "name": "Zhipu AI", - "display_name": "Zhipu AI", - "api": "https://open.bigmodel.cn/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ + }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 131072, "output": 131072 }, "temperature": true, @@ -155105,31 +163709,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 5, - "output": 22, - "cache_read": 1.2, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": 
"GLM-5", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -155139,7 +163736,7 @@ ] }, "limit": { - "context": 204800, + "context": 202752, "output": 131072 }, "temperature": true, @@ -155150,41 +163747,35 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2025-11", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "input": 1.4, + "output": 4.4 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B Instruct", + "display_name": "Gemma 4 31B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 262144, "output": 131072 }, "temperature": true, @@ -155193,33 +163784,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 6, - "output": 24, - "cache_read": 1.3, - "cache_write": 0 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 
70B", "modalities": { "input": [ "text" @@ -155229,37 +163808,29 @@ ] }, "limit": { - "context": 200000, + "context": 131072, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.88, + "output": 0.88 }, "type": "chat" }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "essentialai/Rnj-1-Instruct", + "name": "Rnj-1 Instruct", + "display_name": "Rnj-1 Instruct", "modalities": { "input": [ "text" @@ -155269,45 +163840,40 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-10", + "release_date": "2025-12-05", + "last_updated": "2025-12-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "MiniMaxAI/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -155315,21 +163881,32 @@ "supported": true, "default": true }, - "attachment": true, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0.3, - "output": 0.9 + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -155355,56 +163932,51 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.6, - "output": 1.8 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": 
"Qwen/Qwen3-235B-A22B-Instruct-2507-tput", + "name": "Qwen3 235B A22B Instruct 2507 FP8", + "display_name": "Qwen3 235B A22B Instruct 2507 FP8", "modalities": { "input": [ "text" @@ -155414,8 +163986,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -155425,21 +163997,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "output": 0.6 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "Qwen/Qwen3.6-Plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text" @@ -155449,8 +164019,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1000000, + "output": 500000 }, "temperature": true, "tool_call": true, @@ -155458,23 +164028,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "Qwen/Qwen3-Coder-Next-FP8", + "name": "Qwen3 Coder Next FP8", + "display_name": "Qwen3 Coder Next FP8", "modalities": { "input": [ "text" @@ -155484,8 +164062,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 
262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -155495,32 +164073,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2026-02-03", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "input": 0.5, + "output": 1.2 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 130000 }, "temperature": true, "tool_call": true, @@ -155541,95 +164118,311 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "output": 3.6 }, "type": "chat" } ] }, - "nova": { - "id": "nova", - "name": "Nova", - "display_name": "Nova", - "api": "https://api.nova.amazon.com/v1", - "doc": "https://nova.amazon.com/dev/documentation", + "inference": { + "id": "inference", + "name": "Inference", + "display_name": "Inference", + "api": "https://inference.net/v1", + "doc": "https://inference.net/models", "models": [ { - "id": "nova-2-lite-v1", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "osmosis/osmosis-structure-0.6b", + "name": "Osmosis Structure 0.6B", + "display_name": "Osmosis Structure 0.6B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4000, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + 
"attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.1, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-nemo-12b-instruct", + "name": "Mistral Nemo 12B Instruct", + "display_name": "Mistral Nemo 12B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.038, + "output": 0.1 + }, + "type": "chat" + }, + { + "id": "qwen/qwen-2.5-7b-vision-instruct", + "name": "Qwen 2.5 7B Vision Instruct", + "display_name": "Qwen 2.5 7B Vision Instruct", "modalities": { "input": [ "text", - "image", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 125000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0, - "reasoning": 0 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "nova-2-pro-v1", - "name": "Nova 2 Pro", - "display_name": "Nova 2 Pro", + "id": "qwen/qwen3-embedding-4b", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 2048 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + 
"open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.01, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "google/gemma-3", + "name": "Google Gemma 3", + "display_name": "Google Gemma 3", "modalities": { "input": [ "text", - "image", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 125000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2026-01-03", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0, - "reasoning": 0 + "input": 0.15, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.01, + "output": 0.01 + }, + "type": "chat" + }, + { + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + 
"cost": { + "input": 0.055, + "output": 0.055 + }, + "type": "chat" + }, + { + "id": "meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.02, + "output": 0.02 + }, + "type": "chat" + }, + { + "id": "meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.025, + "output": 0.025 }, "type": "chat" } @@ -167648,9 +176441,9 @@ "type": "chat" }, { - "id": "minimax-m2.7", - "name": "minimax-m2.7", - "display_name": "minimax-m2.7", + "id": "minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", "modalities": { "input": [ "text" @@ -167660,8 +176453,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 204800, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -167670,19 +176463,13 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-12-23", + "last_updated": "2026-01-19", "type": "chat" }, { @@ 
-167725,9 +176512,9 @@ "type": "chat" }, { - "id": "glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "glm-5.1", + "name": "glm-5.1", + "display_name": "glm-5.1", "modalities": { "input": [ "text" @@ -167758,18 +176545,17 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2026-01-19", + "release_date": "2026-03-27", + "last_updated": "2026-04-07", "type": "chat" }, { - "id": "qwen3.5:397b", - "name": "qwen3.5:397b", - "display_name": "qwen3.5:397b", + "id": "kimi-k2:1t", + "name": "kimi-k2:1t", + "display_name": "kimi-k2:1t", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -167777,34 +176563,54 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "minimax-m2", + "name": "minimax-m2", + "display_name": "minimax-m2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-17", + "release_date": "2025-10-23", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "glm-5", - "name": "glm-5", - "display_name": "glm-5", + "id": "deepseek-v4-pro", + "name": "deepseek-v4-pro", + "display_name": "deepseek-v4-pro", "modalities": { "input": [ "text" @@ -167814,8 +176620,8 @@ ] }, "limit": { - "context": 202752, - "output": 
131072 + "context": 1048576, + "output": 1048576 }, "tool_call": true, "reasoning": { @@ -167835,41 +176641,46 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "type": "chat" }, { - "id": "qwen3-vl:235b-instruct", - "name": "qwen3-vl:235b-instruct", - "display_name": "qwen3-vl:235b-instruct", + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 163840, + "output": 65536 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-09-22", + "release_date": "2025-06-15", "last_updated": "2026-01-19", "type": "chat" }, { - "id": "minimax-m2", - "name": "minimax-m2", - "display_name": "minimax-m2", + "id": "minimax-m2.5", + "name": "minimax-m2.5", + "display_name": "minimax-m2.5", "modalities": { "input": [ "text" @@ -167880,11 +176691,12 @@ }, "limit": { "context": 204800, - "output": 128000 + "output": 131072 }, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -167893,14 +176705,15 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-10-23", - "last_updated": "2026-01-19", + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "minimax-m2.1", - "name": "minimax-m2.1", - "display_name": "minimax-m2.1", + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", "modalities": { "input": [ "text" @@ -167910,7 +176723,7 @@ ] }, "limit": { - "context": 204800, + "context": 202752, "output": 
131072 }, "tool_call": true, @@ -167925,14 +176738,14 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", + "release_date": "2025-09-29", "last_updated": "2026-01-19", "type": "chat" }, { - "id": "glm-5.1", - "name": "glm-5.1", - "display_name": "glm-5.1", + "id": "minimax-m2.7", + "name": "minimax-m2.7", + "display_name": "minimax-m2.7", "modalities": { "input": [ "text" @@ -167942,8 +176755,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 196608, + "output": 196608 }, "tool_call": true, "reasoning": { @@ -167963,18 +176776,17 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-07", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "type": "chat" }, { - "id": "mistral-large-3:675b", - "name": "mistral-large-3:675b", - "display_name": "mistral-large-3:675b", + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -167985,32 +176797,6 @@ "output": 262144 }, "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2026-01-19", - "type": "chat" - }, - { - "id": "deepseek-v4-flash", - "name": "deepseek-v4-flash", - "display_name": "deepseek-v4-flash", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1048576, - "output": 1048576 - }, - "tool_call": true, "reasoning": { "supported": true, "default": true @@ -168028,46 +176814,42 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "glm-4.6", - "name": "glm-4.6", - "display_name": "glm-4.6", + "id": "qwen3-vl:235b-instruct", + "name": 
"qwen3-vl:235b-instruct", + "display_name": "qwen3-vl:235b-instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, + "context": 262144, "output": 131072 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-29", + "release_date": "2025-09-22", "last_updated": "2026-01-19", "type": "chat" }, { - "id": "kimi-k2.6", - "name": "kimi-k2.6", - "display_name": "kimi-k2.6", + "id": "qwen3.5:397b", + "name": "qwen3.5:397b", + "display_name": "qwen3.5:397b", "modalities": { "input": [ "text", @@ -168079,7 +176861,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, "tool_call": true, "reasoning": { @@ -168088,19 +176870,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "release_date": "2026-02-15", + "last_updated": "2026-02-17", "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "deepseek-v4-pro", - "display_name": "deepseek-v4-pro", + "id": "deepseek-v4-flash", + "name": "deepseek-v4-flash", + "display_name": "deepseek-v4-flash", "modalities": { "input": [ "text" @@ -168136,9 +176924,9 @@ "type": "chat" }, { - "id": "minimax-m2.5", - "name": "minimax-m2.5", - "display_name": "minimax-m2.5", + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ "text" @@ -168148,7 +176936,7 @@ ] }, "limit": { - "context": 204800, + "context": 202752, "output": 131072 }, "tool_call": true, @@ -168158,20 +176946,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + 
"supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-12-22", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "deepseek-v3.2", - "display_name": "deepseek-v3.2", + "id": "glm-5", + "name": "glm-5", + "display_name": "glm-5", "modalities": { "input": [ "text" @@ -168181,8 +176974,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 202752, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -168191,22 +176984,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-06-15", - "last_updated": "2026-01-19", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "kimi-k2.6", + "name": "kimi-k2.6", + "display_name": "kimi-k2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -168223,29 +177023,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2026-01-19", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "type": "chat" }, { - "id": "kimi-k2:1t", - "name": "kimi-k2:1t", - "display_name": "kimi-k2:1t", + "id": "mistral-large-3:675b", + "name": "mistral-large-3:675b", + 
"display_name": "mistral-large-3:675b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -168259,10 +177053,9 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", + "release_date": "2025-12-02", "last_updated": "2026-01-19", "type": "chat" } @@ -171998,7 +180791,7 @@ "default": true }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172022,7 +180815,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172046,7 +180839,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172070,7 +180863,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172095,7 +180888,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172120,7 +180913,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "embedding" }, { @@ -172145,7 +180938,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "embedding" }, { @@ -172171,7 +180964,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172197,7 +180990,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172223,7 +181016,7 @@ "default": true }, "attachment": 
true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172249,7 +181042,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172275,7 +181068,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172293,7 +181086,7 @@ }, "limit": { "context": 256000, - "output": 32000 + "output": 64000 }, "tool_call": true, "reasoning": { @@ -172301,7 +181094,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172327,7 +181120,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172353,7 +181146,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172379,7 +181172,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172405,7 +181198,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172431,7 +181224,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172457,7 +181250,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172481,7 +181274,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172507,7 +181300,7 @@ "default": true }, "attachment": 
true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172531,7 +181324,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172552,7 +181345,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedance-1-0-pro-fast-251015", @@ -172572,7 +181365,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedance-1-5-pro-251215", @@ -172593,7 +181386,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedance-2-0-260128", @@ -172615,7 +181408,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedance-2-0-fast-260128", @@ -172637,7 +181430,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedream-4-0-250828", @@ -172653,7 +181446,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "imageGeneration" }, { @@ -172670,7 +181463,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "imageGeneration" }, { @@ -172691,7 +181484,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "imageGeneration" }, { @@ -172711,7 +181504,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "imageGeneration" }, { @@ 
-172731,7 +181524,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172756,7 +181549,7 @@ "default": true }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172776,7 +181569,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172796,7 +181589,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172816,7 +181609,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172836,7 +181629,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172856,7 +181649,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" } ] @@ -174195,6 +182988,58 @@ }, "type": "chat" }, + { + "id": "qwen/qwen3.6-35b-a3b", + "name": "Qwen3.6-35B-A3B", + "display_name": "Qwen3.6-35B-A3B", + "limit": { + "context": 262144, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.6-plus", + "name": "Qwen3.6-Plus", + "display_name": "Qwen3.6-Plus", + "limit": { + "context": 1000000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, 
+ "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, { "id": "xiaomimimo/mimo-v2-flash", "name": "XiaomiMiMo/MiMo-V2-Flash", @@ -174654,12 +183499,7 @@ }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "type": "chat" }, @@ -179381,6 +188221,37 @@ }, "type": "chat" }, + { + "id": "gpt-5.5-pro", + "name": "gpt-5.5-pro", + "display_name": "gpt-5.5-pro", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 1050000, + "output": 1050000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 30, + "output": 180, + "cache_read": 30 + }, + "type": "chat" + }, { "id": "deepseek-v4-flash", "name": "deepseek-v4-flash", @@ -180176,13 +189047,13 @@ "type": "imageGeneration" }, { - "id": "wan2.7-videoedit", - "name": "wan2.7-videoedit", - "display_name": "wan2.7-videoedit", + "id": "wan2.7-i2v", + "name": "wan2.7-i2v", + "display_name": "wan2.7-i2v", "modalities": { "input": [ - "text", - "video" + "image", + "text" ] }, "limit": { @@ -180200,12 +189071,13 @@ "type": "chat" }, { - "id": "wan2.7-t2v", - "name": "wan2.7-t2v", - "display_name": "wan2.7-t2v", + "id": "wan2.7-videoedit", + "name": "wan2.7-videoedit", + "display_name": "wan2.7-videoedit", "modalities": { "input": [ - "text" + "text", + "video" ] }, "limit": { @@ -180223,13 +189095,12 @@ "type": "chat" }, { - "id": "wan2.7-r2v", - "name": "wan2.7-r2v", - "display_name": "wan2.7-r2v", + "id": "wan2.7-t2v", + "name": "wan2.7-t2v", + "display_name": "wan2.7-t2v", "modalities": { "input": [ - "text", - "video" + "text" ] }, "limit": { @@ -180247,13 +189118,13 @@ "type": "chat" }, { - "id": "wan2.7-i2v", - "name": "wan2.7-i2v", - "display_name": "wan2.7-i2v", + "id": 
"wan2.7-r2v", + "name": "wan2.7-r2v", + "display_name": "wan2.7-r2v", "modalities": { "input": [ - "image", - "text" + "text", + "video" ] }, "limit": { @@ -180271,9 +189142,9 @@ "type": "chat" }, { - "id": "wan2.7-image", - "name": "wan2.7-image", - "display_name": "wan2.7-image", + "id": "wan2.7-image-pro", + "name": "wan2.7-image-pro", + "display_name": "wan2.7-image-pro", "modalities": { "input": [ "text", @@ -180296,9 +189167,9 @@ "type": "imageGeneration" }, { - "id": "wan2.7-image-pro", - "name": "wan2.7-image-pro", - "display_name": "wan2.7-image-pro", + "id": "wan2.7-image", + "name": "wan2.7-image", + "display_name": "wan2.7-image", "modalities": { "input": [ "text", @@ -182559,56 +191430,6 @@ }, "type": "chat" }, - { - "id": "web-gpt-image-2-vip", - "name": "web-gpt-image-2-vip", - "display_name": "web-gpt-image-2-vip", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 8, - "cache_read": 0 - }, - "type": "imageGeneration" - }, - { - "id": "web-gpt-image-2", - "name": "web-gpt-image-2", - "display_name": "web-gpt-image-2", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 8, - "cache_read": 0 - }, - "type": "imageGeneration" - }, { "id": "gpt-4.1-free", "name": "gpt-4.1-free", @@ -184111,31 +192932,6 @@ }, "type": "chat" }, - { - "id": "web-gpt-image-1.5", - "name": "web-gpt-image-1.5", - "display_name": "web-gpt-image-1.5", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 8, - "cache_read": 0 - }, - "type": "imageGeneration" - }, { "id": "gpt-5", "name": 
"gpt-5", @@ -184213,35 +193009,6 @@ }, "type": "chat" }, - { - "id": "deepseek-v3.2-speciale", - "name": "deepseek-v3.2-speciale", - "display_name": "deepseek-v3.2-speciale", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.58, - "output": 1.680028 - }, - "type": "chat" - }, { "id": "deepseek-v3.2-think", "name": "deepseek-v3.2-think", @@ -184272,36 +193039,6 @@ }, "type": "chat" }, - { - "id": "deepseek-math-v2", - "name": "deepseek-math-v2", - "display_name": "deepseek-math-v2", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 163000, - "output": 163000 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.492, - "output": 1.968, - "cache_read": 0.0984 - }, - "type": "chat" - }, { "id": "gpt-5-codex", "name": "gpt-5-codex", @@ -185506,25 +194243,6 @@ }, "type": "chat" }, - { - "id": "web-sora-2", - "name": "web-sora-2", - "display_name": "web-sora-2", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 2, - "cache_read": 2 - }, - "type": "chat" - }, { "id": "wan2.2-i2v-plus", "name": "wan2.2-i2v-plus", @@ -185619,25 +194337,6 @@ }, "type": "chat" }, - { - "id": "web-sora-2-pro", - "name": "web-sora-2-pro", - "display_name": "web-sora-2-pro", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 2, - "cache_read": 2 - }, - "type": "chat" - }, { "id": "kimi-for-coding-free", "name": "kimi-for-coding-free", @@ -186201,29 +194900,6 @@ }, "type": "chat" }, - { - "id": 
"DeepSeek-V3.1-Fast", - "name": "DeepSeek-V3.1-Fast", - "display_name": "DeepSeek-V3.1-Fast", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 163000, - "output": 163000 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "cost": { - "input": 1.096, - "output": 3.288 - }, - "type": "chat" - }, { "id": "claude-opus-4-0", "name": "claude-opus-4-0", @@ -187083,62 +195759,6 @@ }, "type": "chat" }, - { - "id": "grok-4-fast-non-reasoning", - "name": "grok-4-fast-non-reasoning", - "display_name": "grok-4-fast-non-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" - }, - { - "id": "grok-4-fast-reasoning", - "name": "grok-4-fast-reasoning", - "display_name": "grok-4-fast-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" - }, { "id": "kimi-k2-0711", "name": "kimi-k2-0711", @@ -187547,6 +196167,62 @@ }, "type": "chat" }, + { + "id": "grok-4-fast-non-reasoning", + "name": "grok-4-fast-non-reasoning", + "display_name": "grok-4-fast-non-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "grok-4-fast-reasoning", + "name": "grok-4-fast-reasoning", + "display_name": "grok-4-fast-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + 
}, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "type": "chat" + }, { "id": "DeepSeek-OCR", "name": "DeepSeek-OCR", @@ -187590,9 +196266,9 @@ "type": "chat" }, { - "id": "veo-3.1-fast-generate-preview", - "name": "veo-3.1-fast-generate-preview", - "display_name": "veo-3.1-fast-generate-preview", + "id": "veo-3.1-generate-preview", + "name": "veo-3.1-generate-preview", + "display_name": "veo-3.1-generate-preview", "modalities": { "input": [ "text", @@ -187610,14 +196286,15 @@ }, "cost": { "input": 2, - "output": 0 + "output": 2, + "cache_read": 0 }, "type": "chat" }, { - "id": "veo-3.1-generate-preview", - "name": "veo-3.1-generate-preview", - "display_name": "veo-3.1-generate-preview", + "id": "veo-3.1-fast-generate-preview", + "name": "veo-3.1-fast-generate-preview", + "display_name": "veo-3.1-fast-generate-preview", "modalities": { "input": [ "text", @@ -187635,8 +196312,7 @@ }, "cost": { "input": 2, - "output": 2, - "cache_read": 0 + "output": 0 }, "type": "chat" }, @@ -190641,31 +199317,6 @@ }, "type": "chat" }, - { - "id": "gpt-4o-image-vip", - "name": "gpt-4o-image-vip", - "display_name": "gpt-4o-image-vip", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 16, - "cache_read": 0 - }, - "type": "imageGeneration" - }, { "id": "Doubao-1.5-thinking-pro", "name": "Doubao-1.5-thinking-pro", @@ -190726,31 +199377,6 @@ }, "type": "chat" }, - { - "id": "gpt-4o-image", - "name": "gpt-4o-image", - "display_name": "gpt-4o-image", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - 
"reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 16, - "cache_read": 0 - }, - "type": "imageGeneration" - }, { "id": "gemma-3-1b-it", "name": "gemma-3-1b-it", @@ -191138,82 +199764,6 @@ }, "type": "chat" }, - { - "id": "ERNIE-X1.1-Preview", - "name": "ERNIE-X1.1-Preview", - "display_name": "ERNIE-X1.1-Preview", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 119000, - "output": 119000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.136, - "output": 0.544 - }, - "type": "chat" - }, - { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "cost": { - "input": 0.14, - "output": 0.56 - }, - "type": "chat" - }, - { - "id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "display_name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" - }, { "id": "minimax-m2", "name": "minimax-m2", @@ -191244,96 +199794,17 @@ "type": "chat" }, { - "id": "kat-dev", - "name": "kat-dev", - "display_name": "kat-dev", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.137, - "output": 0.548 - }, - "type": "chat" - }, - { - "id": "llama-3.3-70b", - "name": "llama-3.3-70b", - "display_name": 
"llama-3.3-70b", - "limit": { - "context": 65536, - "output": 65536 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.6, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "moonshotai/Kimi-Dev-72B", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.32, - "output": 1.28, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "moonshotai/Moonlight-16B-A3B-Instruct", - "name": "moonshotai/Moonlight-16B-A3B-Instruct", - "display_name": "moonshotai/Moonlight-16B-A3B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "nvidia-nemotron-3-super-120b-a12b", - "name": "nvidia-nemotron-3-super-120b-a12b", - "display_name": "nvidia-nemotron-3-super-120b-a12b", + "id": "ERNIE-X1.1-Preview", + "name": "ERNIE-X1.1-Preview", + "display_name": "ERNIE-X1.1-Preview", "modalities": { "input": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 119000, + "output": 119000 }, "tool_call": true, "reasoning": { @@ -191346,50 +199817,44 @@ } }, "cost": { - "input": 0.11, - "output": 0.55, - "cache_read": 0.0275 + "input": 0.136, + "output": 0.544 }, "type": "chat" }, { - "id": "o1-global", - "name": "o1-global", - "display_name": "o1-global", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" 
- ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.14, + "output": 0.56 }, "type": "chat" }, { - "id": "qianfan-qi-vl", - "name": "qianfan-qi-vl", - "display_name": "qianfan-qi-vl", + "id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", + "name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", + "display_name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", "limit": { "context": 8192, "output": 8192 @@ -191400,49 +199865,7 @@ }, "cost": { "input": 0.2, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "qwen2.5-vl-72b-instruct", - "name": "qwen2.5-vl-72b-instruct", - "display_name": "qwen2.5-vl-72b-instruct", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2.4, - "output": 7.2 - }, - "type": "chat" - }, - { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.14, - "output": 0.56 + "output": 0.8 }, "type": "chat" }, @@ -191701,9 +200124,69 @@ "type": "chat" }, { - "id": "unsloth/gemma-3-12b-it", - "name": "unsloth/gemma-3-12b-it", - "display_name": "unsloth/gemma-3-12b-it", + "id": "kat-dev", + "name": "kat-dev", + "display_name": "kat-dev", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.137, + "output": 0.548 + }, + "type": "chat" + }, + { + "id": "llama-3.3-70b", + "name": "llama-3.3-70b", + "display_name": "llama-3.3-70b", + "limit": { + "context": 65536, + "output": 
65536 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.6, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "moonshotai/Kimi-Dev-72B", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.32, + "output": 1.28, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "moonshotai/Moonlight-16B-A3B-Instruct", + "name": "moonshotai/Moonlight-16B-A3B-Instruct", + "display_name": "moonshotai/Moonlight-16B-A3B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -191714,11 +200197,135 @@ }, "cost": { "input": 0.2, - "output": 0.8, + "output": 0.2, "cache_read": 0 }, "type": "chat" }, + { + "id": "nvidia-nemotron-3-super-120b-a12b", + "name": "nvidia-nemotron-3-super-120b-a12b", + "display_name": "nvidia-nemotron-3-super-120b-a12b", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 1000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 0.11, + "output": 0.55, + "cache_read": 0.0275 + }, + "type": "chat" + }, + { + "id": "o1-global", + "name": "o1-global", + "display_name": "o1-global", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + }, + "type": "chat" + }, + { + "id": "qianfan-qi-vl", + "name": "qianfan-qi-vl", + "display_name": "qianfan-qi-vl", + "limit": { + "context": 8192, + "output": 8192 + }, + 
"tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "qwen2.5-vl-72b-instruct", + "name": "qwen2.5-vl-72b-instruct", + "display_name": "qwen2.5-vl-72b-instruct", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2.4, + "output": 7.2 + }, + "type": "chat" + }, + { + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.14, + "output": 0.56 + }, + "type": "chat" + }, { "id": "qwen-qwq-32b", "name": "qwen-qwq-32b", @@ -191780,26 +200387,21 @@ "type": "chat" }, { - "id": "claude-3-5-haiku", - "name": "claude-3-5-haiku", - "display_name": "claude-3-5-haiku", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "unsloth/gemma-3-12b-it", + "name": "unsloth/gemma-3-12b-it", + "display_name": "unsloth/gemma-3-12b-it", "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1.1, - "output": 5.5 + "input": 0.2, + "output": 0.8, + "cache_read": 0 }, "type": "chat" }, @@ -191822,20 +200424,26 @@ "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "claude-3-5-haiku", + "name": "claude-3-5-haiku", + "display_name": "claude-3-5-haiku", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - 
"output": 0.2 + "input": 1.1, + "output": 5.5 }, "type": "chat" }, @@ -191911,6 +200519,24 @@ }, "type": "rerank" }, + { + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" + }, { "id": "gemini-2.0-flash-lite-preview-02-05", "name": "gemini-2.0-flash-lite-preview-02-05", @@ -193603,68 +202229,6 @@ }, "type": "chat" }, - { - "id": "grok-4.20-beta-0309-non-reasoning", - "name": "grok-4.20-beta-0309-non-reasoning", - "display_name": "grok-4.20-beta-0309-non-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 - }, - "type": "chat" - }, - { - "id": "grok-4.20-beta-0309-reasoning", - "name": "grok-4.20-beta-0309-reasoning", - "display_name": "grok-4.20-beta-0309-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 - }, - "type": "chat" - }, { "id": "grok-4.20-multi-agent-beta-0309", "name": "grok-4.20-multi-agent-beta-0309", @@ -193834,6 +202398,68 @@ }, "type": "chat" }, + { + "id": "grok-4.20-beta-0309-non-reasoning", + "name": "grok-4.20-beta-0309-non-reasoning", + "display_name": "grok-4.20-beta-0309-non-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": 
true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 2, + "output": 6, + "cache_read": 0.2 + }, + "type": "chat" + }, + { + "id": "grok-4.20-beta-0309-reasoning", + "name": "grok-4.20-beta-0309-reasoning", + "display_name": "grok-4.20-beta-0309-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 2, + "output": 6, + "cache_read": 0.2 + }, + "type": "chat" + }, { "id": "DESCRIBE", "name": "DESCRIBE", @@ -198555,6 +207181,60 @@ }, "type": "chat" }, + { + "id": "text-moderation-latest", + "name": "text-moderation-latest", + "display_name": "text-moderation-latest", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" + }, + { + "id": "text-moderation-stable", + "name": "text-moderation-stable", + "display_name": "text-moderation-stable", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" + }, + { + "id": "text-search-ada-doc-001", + "name": "text-search-ada-doc-001", + "display_name": "text-search-ada-doc-001", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 20, + "output": 20 + }, + "type": "chat" + }, { "id": "veo3", "name": "veo3", @@ -198583,12 +207263,15 @@ "type": "chat" }, { - "id": "tts-1-hd-1106", - "name": "tts-1-hd-1106", - "display_name": "tts-1-hd-1106", + "id": "veo-3", + "name": "veo-3", + "display_name": "veo-3", "modalities": { "input": [ - 
"audio" + "text", + "image", + "audio", + "video" ] }, "limit": { @@ -198600,9 +207283,11 @@ "supported": false }, "cost": { - "input": 30, - "output": 30 - } + "input": 2, + "output": 2, + "cache_read": 0 + }, + "type": "chat" }, { "id": "whisper-1", @@ -198674,9 +207359,9 @@ "type": "chat" }, { - "id": "tts-1-hd", - "name": "tts-1-hd", - "display_name": "tts-1-hd", + "id": "tts-1-hd-1106", + "name": "tts-1-hd-1106", + "display_name": "tts-1-hd-1106", "modalities": { "input": [ "audio" @@ -198696,9 +207381,9 @@ } }, { - "id": "tts-1-1106", - "name": "tts-1-1106", - "display_name": "tts-1-1106", + "id": "tts-1-hd", + "name": "tts-1-hd", + "display_name": "tts-1-hd", "modalities": { "input": [ "audio" @@ -198713,14 +207398,14 @@ "supported": false }, "cost": { - "input": 15, - "output": 15 + "input": 30, + "output": 30 } }, { - "id": "tts-1", - "name": "tts-1", - "display_name": "tts-1", + "id": "tts-1-1106", + "name": "tts-1-1106", + "display_name": "tts-1-1106", "modalities": { "input": [ "audio" @@ -198739,69 +207424,6 @@ "output": 15 } }, - { - "id": "veo-3", - "name": "veo-3", - "display_name": "veo-3", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 2, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "text-search-ada-doc-001", - "name": "text-search-ada-doc-001", - "display_name": "text-search-ada-doc-001", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 20, - "output": 20 - }, - "type": "chat" - }, - { - "id": "text-moderation-stable", - "name": "text-moderation-stable", - "display_name": "text-moderation-stable", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 
0.2 - }, - "type": "chat" - }, { "id": "yi-large", "name": "yi-large", @@ -198911,9 +207533,14 @@ "type": "chat" }, { - "id": "text-moderation-latest", - "name": "text-moderation-latest", - "display_name": "text-moderation-latest", + "id": "tts-1", + "name": "tts-1", + "display_name": "tts-1", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -198923,10 +207550,9 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 15, + "output": 15 + } }, { "id": "aistudio_gemini-2.0-flash", @@ -199611,8 +208237,8 @@ "display_name": "Anthropic: Claude Haiku 4.5", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" @@ -199627,6 +208253,7 @@ "supported": true, "default": true }, + "attachment": true, "type": "imageGeneration" }, { @@ -199752,6 +208379,7 @@ ] } }, + "attachment": true, "type": "imageGeneration" }, { @@ -199802,157 +208430,209 @@ ] } }, - "type": "imageGeneration" - }, - { - "id": "anthropic/claude-opus-4.7", - "name": "Anthropic: Claude Opus 4.7", - "display_name": "Anthropic: Claude Opus 4.7", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } - }, - "type": "imageGeneration" - }, - { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 64000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, "attachment": true, "type": "imageGeneration" }, - { - "id": "anthropic/claude-sonnet-4.5", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "type": "imageGeneration" - }, - { - "id": "anthropic/claude-sonnet-4.6", - "name": "Anthropic: Claude Sonnet 4.6", - "display_name": "Anthropic: Claude Sonnet 4.6", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
- ] - } - }, - "type": "imageGeneration" - }, + { + "id": "anthropic/claude-opus-4.7", + "name": "Anthropic: Claude Opus 4.7", + "display_name": "Anthropic: Claude Opus 4.7", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "anthropic/claude-opus-4.7-fast", + "name": "Anthropic: Claude Opus 4.7 (Fast)", + "display_name": "Anthropic: Claude Opus 4.7 (Fast)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "anthropic/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "anthropic/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "anthropic/claude-sonnet-4.6", + "name": "Anthropic: Claude Sonnet 4.6", + "display_name": "Anthropic: Claude Sonnet 4.6", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." 
+ ] + } + }, + "attachment": true, + "type": "imageGeneration" + }, { "id": "arcee-ai/coder-large", "name": "Arcee AI: Coder Large", @@ -200278,9 +208958,9 @@ "type": "imageGeneration" }, { - "id": "baidu/qianfan-ocr-fast:free", - "name": "Baidu: Qianfan-OCR-Fast (free)", - "display_name": "Baidu: Qianfan-OCR-Fast (free)", + "id": "baidu/qianfan-ocr-fast", + "name": "Baidu: Qianfan-OCR-Fast", + "display_name": "Baidu: Qianfan-OCR-Fast", "modalities": { "input": [ "image", @@ -200841,11 +209521,6 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "type": "chat" }, { @@ -200861,8 +209536,8 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 1048575, + "output": 1048575 }, "tool_call": true, "reasoning": { @@ -200882,6 +209557,29 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v4-flash:free", + "name": "DeepSeek: DeepSeek V4 Flash (free)", + "display_name": "DeepSeek: DeepSeek V4 Flash (free)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 384000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "deepseek/deepseek-v4-pro", "name": "DeepSeek: DeepSeek V4 Pro", @@ -201961,9 +210659,9 @@ "type": "chat" }, { - "id": "inclusionai/ring-2.6-1t:free", - "name": "inclusionAI: Ring-2.6-1T (free)", - "display_name": "inclusionAI: Ring-2.6-1T (free)", + "id": "inclusionai/ring-2.6-1t", + "name": "inclusionAI: Ring-2.6-1T", + "display_name": "inclusionAI: Ring-2.6-1T", "modalities": { "input": [ "text" @@ -202753,6 +211451,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202776,6 +211475,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202799,6 +211499,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202822,6 +211523,7 @@ "reasoning": 
{ "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202940,6 +211642,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202963,6 +211666,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202986,6 +211690,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203010,6 +211715,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { @@ -203034,6 +211740,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { @@ -203058,6 +211765,7 @@ "supported": true, "default": true }, + "attachment": true, "type": "imageGeneration" }, { @@ -203082,6 +211790,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { @@ -203128,6 +211837,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203246,6 +211956,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203270,6 +211981,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { @@ -203293,7 +212005,8 @@ "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": true }, { "id": "moonshotai/kimi-k2", @@ -203422,8 +212135,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262142, + "output": 262142 }, "tool_call": true, "reasoning": { @@ -205410,6 +214123,11 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "type": "imageGeneration" }, @@ -206129,6 +214847,31 @@ }, "type": "chat" }, + { + "id": "perceptron/perceptron-mk1", + "name": "Perceptron: Perceptron Mk1", + "display_name": "Perceptron: Perceptron Mk1", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 8192 + }, + 
"tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "type": "imageGeneration" + }, { "id": "perplexity/sonar", "name": "Perplexity: Sonar", @@ -206383,28 +215126,6 @@ }, "type": "chat" }, - { - "id": "qwen/qwen-max", - "name": "Qwen: Qwen-Max", - "display_name": "Qwen: Qwen-Max", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 8192 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "qwen/qwen-plus", "name": "Qwen: Qwen-Plus", @@ -206439,42 +215160,9 @@ "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28", - "name": "Qwen: Qwen Plus 0728", - "display_name": "Qwen: Qwen Plus 0728", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 32768 - }, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "type": "chat" - }, - { - "id": "qwen/qwen-plus-2025-07-28:thinking", - "name": "Qwen: Qwen Plus 0728 (thinking)", - "display_name": "Qwen: Qwen Plus 0728 (thinking)", + "id": "qwen/qwen-plus-2025-07-28", + "name": "Qwen: Qwen Plus 0728", + "display_name": "Qwen: Qwen Plus 0728", "modalities": { "input": [ "text" @@ -206488,29 +215176,6 @@ "output": 32768 }, "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, - { - "id": "qwen/qwen-turbo", - "name": "Qwen: Qwen-Turbo", - "display_name": "Qwen: Qwen-Turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "tool_call": true, "reasoning": { "supported": true }, @@ -206528,50 +215193,27 @@ "type": "chat" }, { - "id": "qwen/qwen-vl-max", - "name": "Qwen: Qwen VL Max", - 
"display_name": "Qwen: Qwen VL Max", + "id": "qwen/qwen-plus-2025-07-28:thinking", + "name": "Qwen: Qwen Plus 0728 (thinking)", + "display_name": "Qwen: Qwen Plus 0728 (thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1000000, "output": 32768 }, "tool_call": true, "reasoning": { - "supported": false - }, - "type": "imageGeneration" - }, - { - "id": "qwen/qwen-vl-plus", - "name": "Qwen: Qwen VL Plus", - "display_name": "Qwen: Qwen VL Plus", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { "id": "qwen/qwen2.5-vl-72b-instruct", @@ -208282,177 +216924,6 @@ }, "type": "chat" }, - { - "id": "x-ai/grok-3", - "name": "xAI: Grok 3", - "display_name": "xAI: Grok 3", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" - }, - { - "id": "x-ai/grok-3-beta", - "name": "xAI: Grok 3 Beta", - "display_name": "xAI: Grok 3 Beta", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" - }, - { - "id": "x-ai/grok-3-mini", - "name": "xAI: Grok 3 Mini", - "display_name": "xAI: Grok 3 Mini", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, - { - "id": "x-ai/grok-3-mini-beta", - "name": "xAI: Grok 3 Mini Beta", - "display_name": "xAI: Grok 3 Mini Beta", 
- "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "type": "imageGeneration" - }, - { - "id": "x-ai/grok-4-fast", - "name": "xAI: Grok 4 Fast", - "display_name": "xAI: Grok 4 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 30000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "type": "imageGeneration" - }, - { - "id": "x-ai/grok-4.1-fast", - "name": "xAI: Grok 4.1 Fast", - "display_name": "xAI: Grok 4.1 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 30000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "type": "imageGeneration" - }, { "id": "x-ai/grok-4.20", "name": "xAI: Grok 4.20", @@ -208532,34 +217003,6 @@ }, "type": "imageGeneration" }, - { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 10000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "type": 
"chat" - }, { "id": "xiaomi/mimo-v2-flash", "name": "Xiaomi: MiMo-V2-Flash", @@ -208818,8 +217261,8 @@ ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -209542,6 +217985,74 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v4-flash", + "name": "Deepseek V4 Flash", + "display_name": "Deepseek V4 Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 393216 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "deepseek/deepseek-v4-pro", + "name": "Deepseek V4 Pro", + "display_name": "Deepseek V4 Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 393216 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, { "id": "deepseek/deepseek-ocr-2", "name": "DeepSeek-OCR 2", @@ -210358,6 +218869,87 @@ }, "type": "chat" }, + { + "id": "zai-org/glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 202800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "type": "chat" + }, + { + "id": "zai-org/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", + "modalities": { + "input": [ + "text" + 
], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "type": "chat" + }, + { + "id": "zai-org/glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "zai-org/glm-ocr", "name": "GLM-OCR", @@ -211394,6 +219986,30 @@ }, "type": "chat" }, + { + "id": "gpt-5.5-light", + "name": "gpt-5.5-light", + "display_name": "gpt-5.5-light", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "gpt-5.5-pro", "name": "gpt-5.5-pro", @@ -211416,6 +220032,11 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "type": "chat" }, { @@ -211813,6 +220434,28 @@ }, "type": "chat" }, + { + "id": "inclusionai/ling-2.6-flash", + "name": "Ling-2.6-flash", + "display_name": "Ling-2.6-flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "meta-llama/llama-3.1-8b-instruct", "name": "Llama 3.1 8B Instruct", @@ -212004,6 +220647,102 @@ }, "type": "chat" }, + { + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax M2.5-highspeed", + "display_name": "MiniMax M2.5-highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 
204800, + "output": 131100 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "type": "chat" + }, + { + "id": "minimax/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131100 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax M2.7-highspeed", + "display_name": "MiniMax M2.7-highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, { "id": "mistralai/mistral-7b-instruct", "name": "Mistral 7B Instruct", @@ -212618,6 +221357,209 @@ }, "type": "chat" }, + { + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5-122B-A10B", + "display_name": "Qwen3.5-122B-A10B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65500 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-27b", + 
"name": "Qwen3.5-27B", + "display_name": "Qwen3.5-27B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65500 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5-35B-A3B", + "display_name": "Qwen3.5-35B-A3B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65500 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-plus", + "name": "Qwen3.5-Plus", + "display_name": "Qwen3.5-Plus", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": 
true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "inclusionai/ring-2.6-1t", + "name": "Ring-2.6-1T", + "display_name": "Ring-2.6-1T", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "sao10k/l3-8b-lunaris", "name": "Sao10k L3 8B Lunaris", @@ -212662,6 +221604,29 @@ "default": true }, "type": "chat" + }, + { + "id": "xiaomimimo/mimo-v2.5-pro", + "name": "XiaomiMiMo/MiMo-V2.5-Pro", + "display_name": "XiaomiMiMo/MiMo-V2.5-Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" } ] }, @@ -212694,7 +221659,6 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", "release_date": "2024-10-22", "last_updated": "2024-10-22", "cost": { @@ -212725,11 +221689,11 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-01-01", "release_date": "2025-10-15", "last_updated": "2025-10-15", "cost": { @@ -212747,7 +221711,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -212783,7 +221748,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -212818,8 +221784,8 @@ "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ - "pdf", "image", + "pdf", "text" ], "output": [ @@ -212838,9 +221804,8 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01-01", "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "last_updated": 
"2026-03-15", "cost": { "input": 5, "output": 25, @@ -212914,16 +221879,14 @@ "display_name": "Anthropic: Claude Opus 4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 409600, "output": 128000 }, "temperature": false, @@ -212962,10 +221925,9 @@ "release_date": "2026-04-16", "last_updated": "2026-04-16", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 4.5, + "output": 22.5, + "cache_read": 0.45 }, "type": "chat" }, @@ -212976,7 +221938,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -213011,15 +221974,16 @@ "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -213030,9 +221994,8 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "last_updated": "2026-03-15", "cost": { "input": 3, "output": 15, @@ -213416,8 +222379,9 @@ }, "limit": { "context": 163840, - "output": 163840 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -213434,6 +222398,16 @@ ] } }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "cost": { + "input": 0.7, + "output": 2.5, + "cache_read": 0.35 + }, "type": "chat" }, { @@ -213449,14 +222423,23 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 7168 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.15, + "output": 0.75 + }, "type": 
"chat" }, { @@ -213508,8 +222491,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -213553,8 +222536,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -213579,9 +222562,9 @@ "release_date": "2026-04-24", "last_updated": "2026-04-24", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 1.69, + "output": 3.38, + "cache_read": 0.13 }, "type": "chat" }, @@ -213607,14 +222590,13 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.03 + "input": 0.32, + "output": 0.89, + "cache_read": 0.15 }, "type": "chat" }, @@ -213631,8 +222613,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -213651,14 +222633,15 @@ ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "attachment": true, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "cost": { - "input": 0.29, - "output": 0.43 + "input": 0.435, + "output": 0.87, + "cache_read": 0.028 }, "type": "chat" }, @@ -213675,8 +222658,8 @@ ] }, "limit": { - "context": 163000, - "output": 64000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -213685,13 +222668,12 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", + "open_weights": true, "release_date": "2025-09-29", "last_updated": "2025-09-29", "cost": { - "input": 0.22, - 
"output": 0.33 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, @@ -213744,12 +222726,13 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { "input": 0.3, "output": 2.5, - "cache_read": 0.03 + "cache_read": 0.075, + "cache_write": 0.55 }, "type": "chat" }, @@ -213759,9 +222742,11 @@ "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ + "audio", "image", + "pdf", "text", - "audio" + "video" ], "output": [ "text" @@ -213798,16 +222783,15 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "release_date": "2025-06-17", + "last_updated": "2026-03-15", "cost": { "input": 0.1, "output": 0.4, - "cache_read": 0.03, - "cache_write": 1 + "cache_read": 0.01, + "cache_write": 0.083333 }, - "type": "imageGeneration" + "type": "chat" }, { "id": "google/gemini-2.5-pro", @@ -213862,7 +222846,8 @@ "cost": { "input": 1.25, "output": 10, - "cache_read": 0.125 + "cache_read": 0.31, + "cache_write": 2.375 }, "type": "chat" }, @@ -213923,10 +222908,11 @@ "display_name": "Google: Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text", + "audio", "image", - "video", - "audio" + "pdf", + "text", + "video" ], "output": [ "text" @@ -213936,7 +222922,7 @@ "context": 1048576, "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -213949,11 +222935,13 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-18", - "last_updated": "2026-02-18", + "release_date": "2026-05-07", + "last_updated": "2026-05-16", "cost": { "input": 0.25, - "output": 1.5 + "output": 1.5, + "cache_read": 0.025, + "cache_write": 0.08333 }, "type": "chat" }, @@ -213963,9 +222951,10 @@ "display_name": "Google: Gemini 3.1 Flash Lite Preview", "modalities": { 
"input": [ - "text", - "image", "audio", + "image", + "pdf", + "text", "video" ], "output": [ @@ -213973,13 +222962,14 @@ ] }, "limit": { - "context": 1050000, - "output": 65530 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -213988,8 +222978,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-03-20", - "last_updated": "2025-03-20", + "release_date": "2026-03-03", + "last_updated": "2026-03-15", "cost": { "input": 0.25, "output": 1.5 @@ -214002,11 +222992,11 @@ "display_name": "Google: Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text", - "image", - "video", "audio", - "pdf" + "image", + "pdf", + "text", + "video" ], "output": [ "text" @@ -214041,13 +223031,11 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "last_updated": "2026-03-15", "cost": { "input": 2, - "output": 12, - "cache_read": 0.2 + "output": 12 }, "type": "chat" }, @@ -214075,7 +223063,6 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-10", "release_date": "2025-03-13", "last_updated": "2025-03-13", "cost": { @@ -214159,75 +223146,13 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", - "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.016 - }, - "type": "chat" - }, - { - "id": "inclusionai/ling-flash-2.0", - "name": "inclusionAI: Ling-flash-2.0", - "display_name": "inclusionAI: Ling-flash-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": 
"2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" - }, - { - "id": "inclusionai/ling-mini-2.0", - "name": "inclusionAI: Ling-mini-2.0", - "display_name": "inclusionAI: Ling-mini-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, @@ -214299,52 +223224,8 @@ ] }, "limit": { - "context": 262000, - "output": 66000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-05-08", - "last_updated": "2026-05-08", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "inclusionai/ring-flash-2.0", - "name": "inclusionAI: Ring-flash-2.0", - "display_name": "inclusionAI: Ring-flash-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -214352,41 +223233,14 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "release_date": "2026-05-08", + "last_updated": "2026-05-16", "cost": 
{ - "input": 0.14, - "output": 0.57 - }, - "type": "chat" - }, - { - "id": "inclusionai/ring-mini-2.0", - "name": "inclusionAI: Ring-mini-2.0", - "display_name": "inclusionAI: Ring-mini-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "input": 0.075, + "output": 0.625, + "cache_read": 0.015 }, "type": "chat" }, @@ -214500,8 +223354,8 @@ ] }, "limit": { - "context": 204000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -214511,19 +223365,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", + "open_weights": true, "release_date": "2025-10-27", "last_updated": "2025-10-27", "cost": { "input": 0.3, "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.38 + "cache_read": 0.03 }, "type": "chat" }, @@ -214720,7 +223578,7 @@ }, "limit": { "context": 204800, - "output": 131070 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -214739,14 +223597,15 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.611, - "output": 2.4439 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, @@ -214826,14 +223685,13 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", + "open_weights": true, + "knowledge": "2024-10", + "release_date": 
"2025-09-05", + "last_updated": "2025-09-05", "cost": { "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "output": 2.5 }, "type": "chat" }, @@ -215239,13 +224097,33 @@ "id": "openai/gpt-5-chat", "name": "OpenAI: GPT-5 Chat", "display_name": "OpenAI: GPT-5 Chat", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 272000, - "output": 16384 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10 }, "type": "chat" }, @@ -215846,6 +224724,8 @@ "display_name": "OpenAI: GPT-5.3 Chat", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -215854,18 +224734,16 @@ }, "limit": { "context": 128000, - "output": 16380 + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-03-04", + "last_updated": "2026-03-15", "cost": { "input": 1.75, "output": 14 @@ -215878,7 +224756,9 @@ "display_name": "OpenAI: GPT-5.3-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -215888,7 +224768,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -215918,11 +224798,12 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { "input": 1.75, - "output": 14 + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, @@ -215933,7 +224814,8 @@ 
"modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -215989,6 +224871,8 @@ "display_name": "OpenAI: GPT-5.4 Mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -215999,7 +224883,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -216029,12 +224913,12 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { "input": 0.75, - "output": 4.5 + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, @@ -216044,6 +224928,8 @@ "display_name": "OpenAI: GPT-5.4 Nano", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -216054,7 +224940,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -216082,14 +224968,14 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { "input": 0.2, - "output": 1.25 + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, @@ -216100,7 +224986,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -216110,7 +224997,7 @@ "context": 1050000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -216139,11 +225026,12 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 45, - "output": 225 + "input": 30, + "output": 180, + "cache_read": 30 }, 
"type": "chat" }, @@ -216194,9 +225082,8 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { "input": 5, "output": 30, @@ -216228,11 +225115,15 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { "input": 30, "output": 180 @@ -216298,13 +225189,22 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 52429 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-01", + "cost": { + "input": 0.071, + "output": 0.1 + }, "type": "chat" }, { @@ -216320,8 +225220,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -216341,12 +225241,15 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0.11, + "output": 0.6, + "cache_read": 0.055, + "cache_write": 0.22 }, "type": "chat" }, @@ -216363,13 +225266,14 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -216383,12 +225287,13 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": 
"2025-11-25", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.06, + "output": 0.24, + "cache_read": 0.025 }, "type": "chat" }, @@ -216406,12 +225311,21 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 66536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0.3, + "output": 1.2 }, "type": "chat" }, @@ -216428,24 +225342,22 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.65, + "output": 3.25, + "cache_read": 0.2 }, "type": "chat" }, @@ -216462,8 +225374,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -216483,12 +225395,12 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 1.2, - "output": 6 + "input": 2.11, + "output": 8.45 }, "type": "chat" }, @@ -216579,7 +225491,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -216587,7 +225500,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65536 }, "temperature": 
true, "tool_call": true, @@ -216606,14 +225519,14 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.8, - "output": 4.8 + "input": 0.115, + "output": 0.688 }, "type": "chat" }, @@ -216713,6 +225626,7 @@ "display_name": "Qwen: Qwen3.6-Plus", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -216721,7 +225635,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -216740,15 +225654,15 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "release_date": "2025-08-26", + "last_updated": "2026-04-11", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0.325, + "output": 1.95, + "cache_read": 0.0325, + "cache_write": 0.40625 }, "type": "chat" }, @@ -216858,21 +225772,22 @@ }, "limit": { "context": 256000, - "output": 64000 + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { "input": 0.1, - "output": 0.3 + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, @@ -216968,42 +225883,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", - "cost": { - "input": 0.172, - "output": 0.572, - 
"cache_read": 0.058, - "cache_write": 0 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -217011,152 +225892,14 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4-fast", - "name": "xAI: Grok 4 Fast", - "display_name": "xAI: Grok 4 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-20", - "last_updated": "2025-09-20", - "cost": { - "input": 0.2, - "output": 0.5 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4-fast-non-reasoning", - "name": "xAI: Grok 4 Fast None Reasoning", - "display_name": "xAI: Grok 4 Fast None Reasoning", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 30000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4.1-fast", - "name": "xAI: Grok 4.1 Fast", - "display_name": "xAI: Grok 4.1 Fast", - "modalities": { - "input": [ - "text", - 
"image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", - "cost": { - "input": 0.2, - "output": 0.5 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4.1-fast-non-reasoning", - "name": "xAI: Grok 4.1 Fast Non Reasoning", - "display_name": "xAI: Grok 4.1 Fast Non Reasoning", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2026-04-22", + "last_updated": "2026-05-16", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.066, + "output": 0.26, + "cache_read": 0.029 }, "type": "chat" }, @@ -217269,42 +226012,6 @@ }, "type": "chat" }, - { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 131072 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", - "cost": { - "input": 0.2, - "output": 1.5 - }, - "type": "chat" - }, { "id": "xiaomi/mimo-v2-flash", "name": "Xiaomi: MiMo-V2-Flash", @@ -217352,8 +226059,8 @@ ] }, "limit": { - "context": 265000, - "output": 265000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -217386,8 +226093,8 @@ ] }, 
"limit": { - "context": 1000000, - "output": 256000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -217423,8 +226130,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -217469,7 +226176,7 @@ }, "limit": { "context": 1048576, - "output": 131072 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -217524,14 +226231,12 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "last_updated": "2026-03-15", "cost": { "input": 0.6, "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "cache_read": 0.175 }, "type": "chat" }, @@ -217559,14 +226264,12 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", "release_date": "2025-07-28", "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.13, + "output": 0.85, + "cache_read": 0.025 }, "type": "chat" }, @@ -217612,8 +226315,8 @@ "display_name": "Z.AI: GLM 4.6V", "modalities": { "input": [ - "text", "image", + "text", "video" ], "output": [ @@ -217621,8 +226324,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -217631,14 +226334,12 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": true, + "release_date": "2025-09-30", + "last_updated": "2026-01-10", "cost": { - "input": 0.14, - "output": 0.42, - "cache_read": 0.03 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, @@ -217727,8 +226428,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -217748,14 +226449,13 @@ } }, "attachment": false, - 
"open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "release_date": "2025-12-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 1.14, - "cache_read": 0.06 + "input": 0.38, + "output": 1.98, + "cache_read": 0.2 }, "type": "chat" }, @@ -217855,8 +226555,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -217877,13 +226577,11 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.58, - "output": 2.6, - "cache_read": 0.14 + "input": 0.95, + "output": 3.15 }, "type": "chat" }, @@ -217900,8 +226598,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -217914,14 +226612,14 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-15", + "last_updated": "2026-04-11", "cost": { - "input": 0.88, - "output": 3.48 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, @@ -217938,7 +226636,7 @@ ] }, "limit": { - "context": 200000, + "context": 202752, "output": 131072 }, "temperature": true, @@ -217949,23 +226647,16 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-03", - "last_updated": "2026-04-03", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", 
"cost": { - "input": 0.8781, - "output": 3.5126, - "cache_read": 0.1903 + "input": 1.26, + "output": 3.96 }, "type": "chat" }, @@ -217975,18 +226666,17 @@ "display_name": "Z.AI: GLM 5V Turbo", "modalities": { "input": [ - "text", "image", - "video", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -217994,25 +226684,14 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": false, + "open_weights": true, "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "last_updated": "2026-04-11", "cost": { - "input": 0.726, - "output": 3.1946, - "cache_read": 0.1743 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" } diff --git a/scripts/plugin.mjs b/scripts/plugin.mjs new file mode 100644 index 000000000..cdc3f52b8 --- /dev/null +++ b/scripts/plugin.mjs @@ -0,0 +1,156 @@ +import { execFileSync } from 'node:child_process' +import { existsSync, readFileSync, readdirSync } from 'node:fs' +import path from 'node:path' + +const OFFICIAL_PLUGIN_SOURCE = 'deepchat-official' + +function parseArgs(argv) { + const args = { + action: null, + name: null, + platform: process.env.TARGET_PLATFORM || process.platform, + arch: process.env.TARGET_ARCH || process.arch, + pluginRoot: null + } + args.action = argv[0] + for (let i = 1; i < argv.length; i += 1) { + if (argv[i] === '--name') { + args.name = argv[++i] + } else if (argv[i] === '--platform') { + args.platform = argv[++i] + } else if (argv[i] === '--arch') { + args.arch = argv[++i] + } else if (argv[i] === '--plugin-root') { + args.pluginRoot = path.resolve(argv[++i]) + } + } + if (!args.action || !['validate', 'package', 'bundle', 
'verify'].includes(args.action)) { + console.error( + 'Usage: node scripts/plugin.mjs [--name ] [--platform

] [--arch ] [--plugin-root ]' + ) + process.exit(1) + } + if (args.action !== 'verify' && !args.name) { + console.error('Missing required --name argument') + process.exit(1) + } + if (args.action === 'verify' && !args.pluginRoot) { + console.error('Missing required --plugin-root argument for verify') + process.exit(1) + } + return args +} + +const args = parseArgs(process.argv.slice(2)) +const packageVersion = JSON.parse(readFileSync(path.resolve('package.json'), 'utf8')).version + +function readPluginManifest(pluginName) { + const pluginDir = path.resolve('plugins', pluginName) + const manifestPath = path.join(pluginDir, 'plugin.json') + if (!existsSync(manifestPath)) { + throw new Error(`Plugin not found: ${manifestPath}`) + } + const manifest = JSON.parse(readFileSync(manifestPath, 'utf8')) + return { pluginDir, manifest } +} + +function discoverOfficialPlugins() { + const pluginsRoot = path.resolve('plugins') + if (!existsSync(pluginsRoot)) { + return [] + } + + return readdirSync(pluginsRoot, { withFileTypes: true }) + .filter((entry) => entry.isDirectory()) + .map((entry) => { + try { + const { manifest } = readPluginManifest(entry.name) + if (manifest.source?.type !== OFFICIAL_PLUGIN_SOURCE) { + return null + } + return { + name: entry.name, + manifest, + platforms: manifest.engines?.platforms ?? [] + } + } catch { + return null + } + }) + .filter(Boolean) + .sort((a, b) => a.name.localeCompare(b.name)) +} + +function isPluginSupported(plugin, targetPlatform) { + const platforms = new Set(plugin.platforms.map((platform) => String(platform).toLowerCase())) + const aliases = targetPlatform === 'darwin' ? ['darwin', 'macos', 'mac'] : [targetPlatform] + return aliases.some((platform) => platforms.has(platform)) +} + +function artifactBaseName(pluginId) { + return pluginId.startsWith('com.deepchat.plugins.') + ? 
`deepchat-plugin-${pluginId.slice('com.deepchat.plugins.'.length)}` + : pluginId +} + +function artifactFileName(plugin, targetPlatform, targetArch) { + const safeId = artifactBaseName(plugin.manifest.id).replace(/[^a-zA-Z0-9._-]/g, '-') + return `${safeId}-${packageVersion}-${targetPlatform}-${targetArch}.dcplugin` +} + +function verifyArtifacts(options) { + const pluginRoot = path.resolve(options.pluginRoot) + const officialPlugins = discoverOfficialPlugins() + const selected = options.name + ? officialPlugins.filter((plugin) => plugin.name === options.name) + : officialPlugins + + if (options.name && selected.length === 0) { + throw new Error(`Official plugin not found: ${options.name}`) + } + + const expected = selected.filter((plugin) => isPluginSupported(plugin, options.platform)) + if (expected.length === 0) { + throw new Error(`No official plugins are expected for ${options.platform}/${options.arch}`) + } + + for (const plugin of expected) { + const fileName = artifactFileName(plugin, options.platform, options.arch) + const artifactPath = path.join(pluginRoot, fileName) + if (!existsSync(artifactPath)) { + throw new Error(`Missing bundled official plugin: ${artifactPath}`) + } + console.log(`Verified ${path.relative(process.cwd(), artifactPath)}`) + } +} + +try { + if (args.action === 'verify') { + verifyArtifacts(args) + process.exit(0) + } + + const { pluginDir } = readPluginManifest(args.name) + + // Run native build step if the plugin has one (e.g. 
scripts/build-cua-plugin-runtime.mjs) + const nativeBuildScript = path.resolve(`scripts/build-${args.name}-plugin-runtime.mjs`) + if (args.action === 'bundle' && existsSync(nativeBuildScript)) { + const buildArgs = [nativeBuildScript] + if (args.arch) buildArgs.push('--arch', args.arch) + execFileSync('node', buildArgs, { stdio: 'inherit' }) + } + + // Delegate to package-plugin.mjs + const pkgArgs = [path.resolve('scripts/package-plugin.mjs')] + if (args.action === 'validate') pkgArgs.push('--validate') + pkgArgs.push('--release-version-from-root') + if (args.platform) pkgArgs.push('--target-platform', args.platform) + if (args.arch) pkgArgs.push('--target-arch', args.arch) + if (args.action === 'bundle') pkgArgs.push('--out', path.resolve('build/bundled-plugins')) + pkgArgs.push(pluginDir) + + execFileSync('node', pkgArgs, { stdio: 'inherit' }) +} catch (error) { + console.error(error instanceof Error ? error.message : String(error)) + process.exit(1) +} diff --git a/src/main/lib/agentRuntime/questionTool.ts b/src/main/lib/agentRuntime/questionTool.ts index 5160f259c..979dcecb6 100644 --- a/src/main/lib/agentRuntime/questionTool.ts +++ b/src/main/lib/agentRuntime/questionTool.ts @@ -59,6 +59,7 @@ export const questionToolSchema = z 'Whether free-form input is allowed for this question. The field name is `custom`, not `allowOther`.' ) }) + .strict() .describe( 'Ask exactly one blocking clarification question. For multiple clarifications, use multiple deepchat_question tool calls instead of sending a `questions` array.' 
) diff --git a/src/main/presenter/agentRuntimePresenter/dispatch.ts b/src/main/presenter/agentRuntimePresenter/dispatch.ts index 81ff3ac2f..1cf17167a 100644 --- a/src/main/presenter/agentRuntimePresenter/dispatch.ts +++ b/src/main/presenter/agentRuntimePresenter/dispatch.ts @@ -12,7 +12,9 @@ import type { SearchResult } from '@shared/types/core/search' import type { IToolPresenter } from '@shared/types/presenters/tool.presenter' import type { AgentToolProgressUpdate } from '@shared/types/presenters/tool.presenter' import type { AssistantMessageBlock, PermissionMode } from '@shared/types/agent-interface' +import type { AgentPlanSnapshot } from '@shared/types/agent-plan' import { parseQuestionToolArgs, QUESTION_TOOL_NAME } from '../../lib/agentRuntime/questionTool' +import { UPDATE_PLAN_TOOL_NAME } from '../toolPresenter/agentTools/agentPlanTool' import type { InterleavedReasoningConfig, IoParams, @@ -354,6 +356,32 @@ function updateSubagentToolCallBlock( } } +function markInternalPlanToolCallBlock(blocks: AssistantMessageBlock[], toolCallId: string): void { + const block = blocks.find( + (item) => item.type === 'tool_call' && item.tool_call?.id === toolCallId + ) + if (!block?.tool_call || block.tool_call.name !== UPDATE_PLAN_TOOL_NAME) { + return + } + + block.extra = { + ...block.extra, + internalTool: true + } +} + +function publishPlanUpdated(io: IoParams, snapshot: AgentPlanSnapshot): void { + publishDeepchatEvent('chat.plan.updated', { + sessionId: io.sessionId, + messageId: io.messageId, + ...(snapshot.toolCallId ? { toolCallId: snapshot.toolCallId } : {}), + plan: snapshot.plan, + ...(snapshot.explanation ? 
{ explanation: snapshot.explanation } : {}), + revision: snapshot.revision, + updatedAt: snapshot.updatedAt + }) +} + function extractSubagentToolState(rawData: MCPToolResponse): { subagentProgress?: string subagentFinal?: string @@ -799,6 +827,18 @@ async function runToolCall(params: { try { const applyProgressUpdate = (update: AgentToolProgressUpdate) => { + if ( + update.kind === 'agent_plan' && + update.toolCallId === completedToolCall.id && + allowProgressUpdates + ) { + markInternalPlanToolCallBlock(state.blocks, completedToolCall.id) + publishPlanUpdated(io, update.snapshot) + state.dirty = true + scheduleRendererFlush(state, rendererFlushHandle) + return + } + if ( !allowProgressUpdates || update.kind !== 'subagent_orchestrator' || diff --git a/src/main/presenter/agentRuntimePresenter/index.ts b/src/main/presenter/agentRuntimePresenter/index.ts index ac7198b10..473f8bd01 100644 --- a/src/main/presenter/agentRuntimePresenter/index.ts +++ b/src/main/presenter/agentRuntimePresenter/index.ts @@ -57,7 +57,13 @@ import { normalizeImageGenerationOptions, supportsOpenAIImageGenerationSettings } from '@shared/imageGenerationSettings' -import { isDeepSeekSeriesModelId } from '@shared/model' +import { ApiEndpointType, ModelType, isDeepSeekSeriesModelId } from '@shared/model' +import { isTtsModelConfig, isTtsModelId } from '@shared/ttsSettings' +import { + isVideoGenerationModelConfig, + normalizeVideoGenerationOptions, + supportsOpenAICompatibleVideoGeneration +} from '@shared/videoGenerationSettings' import { nanoid } from 'nanoid' import type { SQLitePresenter } from '../sqlitePresenter' import { eventBus, SendTarget } from '@/eventbus' @@ -621,6 +627,8 @@ export class AgentRuntimePresenter implements IAgentImplementation { try { this.throwIfAbortRequested(preStreamAbortSignal) const generationSettings = await this.getEffectiveSessionGenerationSettings(sessionId) + const modelConfig = this.configPresenter.getModelConfig(state.modelId, state.providerId) + const 
useContextBudget = this.shouldUseDeepChatContextBudget(state.providerId, modelConfig) this.throwIfAbortRequested(preStreamAbortSignal) const interleavedReasoning = this.resolveInterleavedReasoningConfig( state.providerId, @@ -629,7 +637,8 @@ export class AgentRuntimePresenter implements IAgentImplementation { ) const contextBudgetLength = this.resolveDeepChatContextBudgetLength( state.providerId, - generationSettings.contextLength + generationSettings.contextLength, + modelConfig ) const maxTokens = capAgentRequestMaxTokens(generationSettings.maxTokens, contextBudgetLength) const activeSkillNames = await this.resolveActiveSkillNamesForToolProfile(sessionId) @@ -656,9 +665,8 @@ export class AgentRuntimePresenter implements IAgentImplementation { think: false } - const compactionIntent = this.shouldBypassDeepChatContextBudget(state.providerId) - ? null - : await this.compactionService.prepareForNextUserTurn({ + const compactionIntent = useContextBudget + ? await this.compactionService.prepareForNextUserTurn({ sessionId, providerId: state.providerId, modelId: state.modelId, @@ -674,6 +682,7 @@ export class AgentRuntimePresenter implements IAgentImplementation { newUserContent: normalizedInput, signal: preStreamAbortSignal }) + : null let summaryState: SessionSummaryState if (compactionIntent) { @@ -1428,15 +1437,53 @@ export class AgentRuntimePresenter implements IAgentImplementation { return resolvedProviderId === 'acp' } - private shouldBypassDeepChatContextBudget(providerId?: string | null): boolean { - return providerId?.trim() === 'acp' + private shouldUseDeepChatContextBudget( + providerId?: string | null, + modelConfig?: Pick | null, + modelId?: string | null + ): boolean { + if (providerId?.trim() === 'acp') { + return false + } + + if (!modelConfig) { + return true + } + + if (modelConfig.type === ModelType.ImageGeneration || modelConfig.type === ModelType.TTS) { + return false + } + + if (modelConfig.apiEndpoint && modelConfig.apiEndpoint !== 
ApiEndpointType.Chat) { + return false + } + + if (modelConfig.endpointType === 'image-generation') { + return false + } + + if (isVideoGenerationModelConfig(modelConfig, modelId?.trim() || '')) { + return false + } + + return true + } + + private shouldBypassDeepChatContextBudget( + providerId?: string | null, + modelConfig?: Pick | null, + modelId?: string | null + ): boolean { + return !this.shouldUseDeepChatContextBudget(providerId, modelConfig, modelId) } private resolveDeepChatContextBudgetLength( providerId: string | null | undefined, - contextLength: number + contextLength: number, + modelConfig?: Pick | null, + modelId?: string | null ): number { - return this.shouldBypassDeepChatContextBudget(providerId) + return this.shouldBypassDeepChatContextBudget(providerId, modelConfig, modelId) ? Number.MAX_SAFE_INTEGER : contextLength } @@ -1619,7 +1666,8 @@ export class AgentRuntimePresenter implements IAgentImplementation { if (!state) { throw new Error(`Session ${sessionId} not found`) } - if (this.shouldBypassDeepChatContextBudget(state.providerId)) { + const modelConfig = this.configPresenter.getModelConfig(state.modelId, state.providerId) + if (this.shouldBypassDeepChatContextBudget(state.providerId, modelConfig, state.modelId)) { throw new Error('Manual compaction is only available for DeepChat agent sessions.') } if (state.status !== 'idle') { @@ -1639,7 +1687,9 @@ export class AgentRuntimePresenter implements IAgentImplementation { ) const contextBudgetLength = this.resolveDeepChatContextBudgetLength( state.providerId, - generationSettings.contextLength + generationSettings.contextLength, + modelConfig, + state.modelId ) const maxTokens = capAgentRequestMaxTokens(generationSettings.maxTokens, contextBudgetLength) const activeSkillNames = await this.resolveActiveSkillNamesForToolProfile(sessionId) @@ -1854,15 +1904,16 @@ export class AgentRuntimePresenter implements IAgentImplementation { ).getProviderInstance(state.providerId) const generationSettings = 
await this.getEffectiveSessionGenerationSettings(sessionId) + const baseModelConfig = this.configPresenter.getModelConfig(state.modelId, state.providerId) const interleavedReasoning = providedInterleavedReasoning ?? this.resolveInterleavedReasoningConfig(state.providerId, state.modelId, generationSettings) - const bypassContextBudget = this.shouldBypassDeepChatContextBudget(state.providerId) const contextBudgetLength = this.resolveDeepChatContextBudgetLength( state.providerId, - generationSettings.contextLength + generationSettings.contextLength, + baseModelConfig, + state.modelId ) - const baseModelConfig = this.configPresenter.getModelConfig(state.modelId, state.providerId) const capabilityProviderId = this.resolveCapabilityProviderId(state.providerId, state.modelId) const reasoningPortrait = this.getReasoningPortrait(state.providerId, state.modelId) const modelConfig: ModelConfig = { @@ -1876,6 +1927,7 @@ export class AgentRuntimePresenter implements IAgentImplementation { reasoningVisibility: generationSettings.reasoningVisibility, verbosity: generationSettings.verbosity, imageGeneration: generationSettings.imageGeneration, + videoGeneration: generationSettings.videoGeneration, reasoning: getReasoningEffectiveEnabledForProvider(capabilityProviderId, reasoningPortrait, { reasoning: baseModelConfig.reasoning, reasoningEffort: generationSettings.reasoningEffort ?? 
baseModelConfig.reasoningEffort @@ -1886,6 +1938,7 @@ export class AgentRuntimePresenter implements IAgentImplementation { const traceEnabled = this.configPresenter.getSetting('traceDebugEnabled') === true const llmProviderPresenter = this.llmProviderPresenter const pendingInputCoordinator = this.pendingInputCoordinator + const shouldBypassContextBudget = this.shouldBypassDeepChatContextBudget.bind(this) const injectSteerInputsIntoRequest = this.injectSteerInputsIntoRequest.bind(this) const recoverContextPressure = this.recoverRequestContextPressure.bind(this) const replaceLeadingSystemPromptInPlace = this.replaceLeadingSystemPromptInPlace.bind(this) @@ -1947,13 +2000,19 @@ export class AgentRuntimePresenter implements IAgentImplementation { requestMaxTokens, requestTools ) { + const requestBypassesContextBudget = shouldBypassContextBudget( + state.providerId, + requestModelConfig + ) const claimedSteerBatch = pendingInputCoordinator.claimSteerBatchForNextLoop(sessionId) const injectedMessages = injectSteerInputsIntoRequest( requestMessages, claimedSteerBatch, supportsVision, supportsAudioInput, - bypassContextBudget ? Number.MAX_SAFE_INTEGER : requestModelConfig.contextLength, + requestBypassesContextBudget + ? Number.MAX_SAFE_INTEGER + : requestModelConfig.contextLength, requestMaxTokens ) @@ -1963,15 +2022,18 @@ export class AgentRuntimePresenter implements IAgentImplementation { try { let providerMessages = injectedMessages let providerMaxTokens = requestMaxTokens + const isTtsRequest = + isTtsModelConfig(requestModelConfig) || isTtsModelId(requestModelId) + const effectiveRequestTools: MCPToolDefinition[] = isTtsRequest ? [] : requestTools - if (!bypassContextBudget) { + if (!requestBypassesContextBudget) { const protectedSteerTailCount = claimedSteerBatch.length > 0 ? claimedSteerBatch.length + (requestMessages.at(-1)?.role === 'user' ? 
1 : 0) : 0 let requestPreflight = preflightRequestContext({ messages: injectedMessages, - tools: requestTools, + tools: effectiveRequestTools, contextLength: requestModelConfig.contextLength, requestedMaxTokens: requestMaxTokens, minimumProtectedTailCount: protectedSteerTailCount @@ -1988,7 +2050,7 @@ export class AgentRuntimePresenter implements IAgentImplementation { baseSystemPrompt, contextLength: requestModelConfig.contextLength, requestedMaxTokens: requestPreflight.requestedMaxTokens, - tools: requestTools, + tools: effectiveRequestTools, supportsVision, supportsAudioInput, interleavedReasoning, @@ -2001,7 +2063,7 @@ export class AgentRuntimePresenter implements IAgentImplementation { } requestPreflight = preflightRequestContext({ messages: requestMessages, - tools: requestTools, + tools: effectiveRequestTools, contextLength: requestModelConfig.contextLength, requestedMaxTokens: requestMaxTokens, minimumProtectedTailCount: protectedSteerTailCount @@ -2041,7 +2103,7 @@ export class AgentRuntimePresenter implements IAgentImplementation { requestModelConfig, requestTemperature, providerMaxTokens, - requestTools + effectiveRequestTools )) { if (!didConsumeSteerBatch && claimedSteerBatch.length > 0) { pendingInputCoordinator.consumeClaimedSteerBatch(sessionId) @@ -2543,6 +2605,8 @@ export class AgentRuntimePresenter implements IAgentImplementation { preStreamAbortSignal = preStreamAbortController.signal this.throwIfAbortRequested(preStreamAbortSignal) const generationSettings = await this.getEffectiveSessionGenerationSettings(sessionId) + const modelConfig = this.configPresenter.getModelConfig(state.modelId, state.providerId) + const useContextBudget = this.shouldUseDeepChatContextBudget(state.providerId, modelConfig) this.throwIfAbortRequested(preStreamAbortSignal) const interleavedReasoning = this.resolveInterleavedReasoningConfig( state.providerId, @@ -2551,7 +2615,9 @@ export class AgentRuntimePresenter implements IAgentImplementation { ) const 
contextBudgetLength = this.resolveDeepChatContextBudgetLength( state.providerId, - generationSettings.contextLength + generationSettings.contextLength, + modelConfig, + state.modelId ) const maxTokens = capAgentRequestMaxTokens(generationSettings.maxTokens, contextBudgetLength) const projectDir = this.resolveProjectDir(sessionId) @@ -2570,9 +2636,8 @@ export class AgentRuntimePresenter implements IAgentImplementation { activeSkillNames ) this.throwIfAbortRequested(preStreamAbortSignal) - const summaryState = this.shouldBypassDeepChatContextBudget(state.providerId) - ? this.sessionStore.getSummaryState(sessionId) - : await this.resolveCompactionStateForResumeTurn({ + const summaryState = useContextBudget + ? await this.resolveCompactionStateForResumeTurn({ sessionId, messageId, providerId: state.providerId, @@ -2588,6 +2653,7 @@ export class AgentRuntimePresenter implements IAgentImplementation { interleavedReasoning.preserveEmptyReasoningContent === true, signal: preStreamAbortSignal }) + : this.sessionStore.getSummaryState(sessionId) this.throwIfAbortRequested(preStreamAbortSignal) const systemPrompt = appendSummarySection(baseSystemPrompt, summaryState.summaryText) let resumeContext = buildResumeContext( @@ -2608,11 +2674,7 @@ export class AgentRuntimePresenter implements IAgentImplementation { interleavedReasoning.preserveEmptyReasoningContent === true } ) - if ( - budgetToolCall?.id && - budgetToolCall.name && - !this.shouldBypassDeepChatContextBudget(state.providerId) - ) { + if (budgetToolCall?.id && budgetToolCall.name && useContextBudget) { const resumeBudget = this.fitResumeBudgetForToolCall({ resumeContext, toolDefinitions: tools, @@ -3389,6 +3451,22 @@ export class AgentRuntimePresenter implements IAgentImplementation { } } + if ( + supportsOpenAICompatibleVideoGeneration({ + providerId, + providerApiType: this.resolveProviderApiType(providerId), + modelId, + apiEndpoint: modelConfig.apiEndpoint, + endpointType: modelConfig.endpointType, + type: 
modelConfig.type + }) + ) { + const videoGeneration = normalizeVideoGenerationOptions(modelConfig.videoGeneration) + if (videoGeneration) { + defaults.videoGeneration = videoGeneration + } + } + const supportsReasoning = this.configPresenter.supportsReasoningCapability?.(providerId, modelId) === true if (supportsReasoning) { @@ -3633,6 +3711,35 @@ export class AgentRuntimePresenter implements IAgentImplementation { delete next.imageGeneration } + if ( + supportsOpenAICompatibleVideoGeneration({ + providerId, + providerApiType: this.resolveProviderApiType(providerId), + modelId, + apiEndpoint: modelConfig.apiEndpoint, + endpointType: modelConfig.endpointType, + type: modelConfig.type + }) + ) { + if (Object.prototype.hasOwnProperty.call(patch, 'videoGeneration')) { + const videoGeneration = normalizeVideoGenerationOptions(patch.videoGeneration) + if (videoGeneration) { + next.videoGeneration = videoGeneration + } else { + delete next.videoGeneration + } + } else { + const videoGeneration = normalizeVideoGenerationOptions(next.videoGeneration) + if (videoGeneration) { + next.videoGeneration = videoGeneration + } else { + delete next.videoGeneration + } + } + } else { + delete next.videoGeneration + } + if (fixedTemperatureKimi) { next.temperature = fixedTemperatureKimi.temperature } diff --git a/src/main/presenter/agentRuntimePresenter/messageStore.ts b/src/main/presenter/agentRuntimePresenter/messageStore.ts index 8169a1bf6..383c4bea5 100644 --- a/src/main/presenter/agentRuntimePresenter/messageStore.ts +++ b/src/main/presenter/agentRuntimePresenter/messageStore.ts @@ -65,6 +65,20 @@ type StructuredMessageMaps = { assistantRows: Map } +function normalizePersistedActionType( + actionType: string | null +): AssistantMessageBlock['action_type'] | undefined { + if ( + actionType === 'tool_call_permission' || + actionType === 'question_request' || + actionType === 'rate_limit' + ) { + return actionType + } + + return undefined +} + function 
extractSearchableMessageContent(rawContent: string): string { try { const parsed = JSON.parse(rawContent) as @@ -761,6 +775,7 @@ export class DeepChatMessageStore { : undefined const imageData = extra.imageData?.trim() + const actionType = normalizePersistedActionType(row.action_type) return { id: extra.id, @@ -778,7 +793,7 @@ export class DeepChatMessageStore { : undefined, tool_call: toolCall as AssistantMessageBlock['tool_call'], extra: extra.extra, - action_type: row.action_type as AssistantMessageBlock['action_type'] + ...(actionType ? { action_type: actionType } : {}) } } diff --git a/src/main/presenter/configPresenter/index.ts b/src/main/presenter/configPresenter/index.ts index 50975d173..35512639e 100644 --- a/src/main/presenter/configPresenter/index.ts +++ b/src/main/presenter/configPresenter/index.ts @@ -27,6 +27,7 @@ import { resolveProviderCapabilityProviderId, type NewApiEndpointType } from '@shared/model' +import { resolveVideoGenerationCompatType } from '@shared/videoGenerationSettings' import { DEFAULT_MODEL_CAPABILITY_FALLBACKS, resolveDerivedModelMaxTokens, @@ -973,6 +974,15 @@ export class ConfigPresenter implements IConfigPresenter { } private inferProviderDbModelType(model: ProviderModel): ModelType { + const videoGenerationType = resolveVideoGenerationCompatType({ + modelId: model.id, + type: model.type, + modalities: model.modalities + }) + if (videoGenerationType) { + return videoGenerationType + } + if (Array.isArray(model.modalities?.output) && model.modalities.output.includes('image')) { return ModelType.ImageGeneration } @@ -984,6 +994,10 @@ export class ConfigPresenter implements IConfigPresenter { return ModelType.Rerank case 'imageGeneration': return ModelType.ImageGeneration + case 'videoGeneration': + return ModelType.VideoGeneration + case 'tts': + return ModelType.TTS case 'chat': default: return ModelType.Chat diff --git a/src/main/presenter/configPresenter/modelConfig.ts b/src/main/presenter/configPresenter/modelConfig.ts index 
ec524ce8c..fcd2c709c 100644 --- a/src/main/presenter/configPresenter/modelConfig.ts +++ b/src/main/presenter/configPresenter/modelConfig.ts @@ -13,6 +13,7 @@ import { resolveModelFunctionCall } from '@shared/modelConfigDefaults' import { applyMoonshotKimiReasoningTemperaturePolicy } from '@shared/moonshotKimiPolicy' +import { resolveVideoGenerationCompatType } from '@shared/videoGenerationSettings' import ElectronStore from 'electron-store' import { providerDbLoader } from './providerDbLoader' import { @@ -105,6 +106,15 @@ export class ModelConfigHelper { * Priority: 1. modalities.output includes image 2. model.type (from provider.json) 3. default Chat */ private inferModelType(model: ProviderModel): ModelType { + const videoGenerationType = resolveVideoGenerationCompatType({ + modelId: model.id, + type: model.type, + modalities: model.modalities + }) + if (videoGenerationType) { + return videoGenerationType + } + // Priority 1: Output modality indicates image generation if (Array.isArray(model.modalities?.output) && model.modalities.output.includes('image')) { return ModelType.ImageGeneration @@ -121,6 +131,10 @@ export class ModelConfigHelper { return ModelType.Rerank case 'imageGeneration': return ModelType.ImageGeneration + case 'videoGeneration': + return ModelType.VideoGeneration + case 'tts': + return ModelType.TTS default: // Invalid type, fall through to default break @@ -176,7 +190,13 @@ export class ModelConfigHelper { reasoning: Boolean(reasoningEnabled), type: modelType, apiEndpoint: - modelType === ModelType.ImageGeneration ? ApiEndpointType.Image : ApiEndpointType.Chat, + modelType === ModelType.ImageGeneration + ? ApiEndpointType.Image + : modelType === ModelType.VideoGeneration + ? ApiEndpointType.Video + : modelType === ModelType.TTS + ? 
ApiEndpointType.AudioSpeech + : ApiEndpointType.Chat, thinkingBudget, forceInterleavedThinkingCompat, reasoningEffort, diff --git a/src/main/presenter/configPresenter/providerModelHelper.ts b/src/main/presenter/configPresenter/providerModelHelper.ts index e71a2833d..6ded4e17d 100644 --- a/src/main/presenter/configPresenter/providerModelHelper.ts +++ b/src/main/presenter/configPresenter/providerModelHelper.ts @@ -2,6 +2,7 @@ import { eventBus, SendTarget } from '@/eventbus' import { CONFIG_EVENTS } from '@/events' import { ModelConfig, MODEL_META } from '@shared/presenter' import { ModelType } from '@shared/model' +import { resolveVideoGenerationCompatType } from '@shared/videoGenerationSettings' import ElectronStore from 'electron-store' import path from 'path' import type { StoreLike } from './storeLike' @@ -143,16 +144,30 @@ export class ProviderModelHelper { normalizedModel.reasoning !== undefined ? normalizedModel.reasoning : config.reasoning || false - normalizedModel.type = - normalizedModel.type !== undefined ? normalizedModel.type : config.type || ModelType.Chat normalizedModel.endpointType = config.endpointType ?? normalizedModel.endpointType + normalizedModel.type = + resolveVideoGenerationCompatType({ + modelId: normalizedModel.id, + type: config.type ?? normalizedModel.type, + apiEndpoint: config.apiEndpoint, + endpointType: normalizedModel.endpointType, + supportedEndpointTypes: normalizedModel.supportedEndpointTypes + }) ?? + (normalizedModel.type !== undefined ? 
normalizedModel.type : config.type || ModelType.Chat) return normalizedModel } normalizedModel.vision = normalizedModel.vision || false normalizedModel.functionCall = normalizedModel.functionCall || false normalizedModel.reasoning = normalizedModel.reasoning || false - normalizedModel.type = normalizedModel.type || ModelType.Chat + normalizedModel.type = + resolveVideoGenerationCompatType({ + modelId: normalizedModel.id, + type: normalizedModel.type, + endpointType: normalizedModel.endpointType, + supportedEndpointTypes: normalizedModel.supportedEndpointTypes + }) ?? + (normalizedModel.type || ModelType.Chat) return normalizedModel } diff --git a/src/main/presenter/index.ts b/src/main/presenter/index.ts index dfb631d9d..5c3a65308 100644 --- a/src/main/presenter/index.ts +++ b/src/main/presenter/index.ts @@ -388,6 +388,14 @@ export class Presenter implements IPresenter { modelId, imageOptions, options + ), + generateVideoStandalone: (providerId, prompt, modelId, videoOptions, options) => + this.llmproviderPresenter.generateVideoStandalone( + providerId, + prompt, + modelId, + videoOptions, + options ) }), cacheImage: (data) => this.devicePresenter.cacheImage(data), diff --git a/src/main/presenter/llmProviderPresenter/aiSdk/runtime.ts b/src/main/presenter/llmProviderPresenter/aiSdk/runtime.ts index ea7207aa4..bf5cf959b 100644 --- a/src/main/presenter/llmProviderPresenter/aiSdk/runtime.ts +++ b/src/main/presenter/llmProviderPresenter/aiSdk/runtime.ts @@ -19,13 +19,34 @@ import { supportsOpenAIImageGenerationSettings, type ImageGenerationOptions } from '@shared/imageGenerationSettings' +import { + isVideoGenerationModelConfig, + normalizeVideoGenerationOptions, + resolveOpenAICompatibleVideoRequestBodyShape, + type VideoGenerationOptions, + type VideoGenerationReference +} from '@shared/videoGenerationSettings' +import { + isChatAudioTtsModel, + isGeminiGenerateContentTtsModel, + isTtsModelId, + isTtsModelConfig, + normalizeTtsSettings, + ttsFormatToMimeType +} from 
'@shared/ttsSettings' import { presenter } from '@/presenter' import { EMBEDDING_TEST_KEY, isNormalized } from '@/utils/vector' import type { LLMCoreStreamEvent } from '@shared/types/core/llm-events' import { mcpToolsToAISDKTools } from './toolMapper' import { mapMessagesToModelMessages } from './messageMapper' import { buildProviderOptions } from './providerOptionsMapper' -import { type AiSdkProviderKind, createAiSdkProviderContext } from './providerFactory' +import { ProxyAgent } from 'undici' +import { proxyConfig } from '../../proxyConfig' +import { + type AiSdkProviderKind, + createAiSdkProviderContext, + normalizeGeminiBaseUrl +} from './providerFactory' import { adaptAiSdkStream } from './streamAdapter' type ImageGenerationProviderPayload = Record @@ -34,6 +55,41 @@ type ImageGenerationRequestOptions = { providerOptions?: Record } +type VideoGenerationRequestBody = { + model: string + prompt: string + seconds?: string + size?: string + input_reference?: string | { mime_type?: string; data: string } + content?: Array> + ratio?: string + duration?: number + resolution?: string + watermark?: boolean + generate_audio?: boolean + extra_body?: Record +} + +type VideoGenerationTaskResponse = { + id?: string + status?: string + url?: string | null + error?: + | string + | { + message?: string + } + | null +} + +const DEFAULT_GEMINI_TTS_VOICE = 'Kore' +const DEFAULT_GEMINI_PCM_SAMPLE_RATE = 24000 +const DEFAULT_GEMINI_PCM_BITS_PER_SAMPLE = 16 +const VIDEO_GENERATION_POLL_INTERVAL_MS = 3000 +const PROMPT_VIDEO_DURATION_EN_PATTERN = + /(^|[^0-9a-z])(?\d{1,2})\s*(?:s|sec|secs|second|seconds)\b/i +const PROMPT_VIDEO_DURATION_ZH_PATTERN = /(?\d{1,2})\s*秒/u + export interface AiSdkRuntimeContext { providerKind: AiSdkProviderKind provider: LLM_PROVIDER @@ -53,6 +109,8 @@ export interface AiSdkRuntimeContext { cleanHeaders?: boolean supportsNativeTools?: (modelId: string, modelConfig: ModelConfig) => boolean shouldUseImageGeneration?: (modelId: string, modelConfig: 
ModelConfig) => boolean + shouldUseVideoGeneration?: (modelId: string, modelConfig: ModelConfig) => boolean + shouldUseTts?: (modelId: string, modelConfig: ModelConfig) => boolean } function resolveCapabilityProviderId(context: AiSdkRuntimeContext, modelId: string): string { @@ -127,6 +185,63 @@ function normalizePromptValue(value: unknown): string { return '' } +function supportsPromptDerivedVideoDuration(modelId: string, duration: number): boolean { + const normalizedModelId = modelId.trim().toLowerCase() + + if (normalizedModelId.startsWith('doubao-seedance-')) { + return duration >= 4 && duration <= 15 + } + + return true +} + +function resolvePromptVideoDuration(prompt: string, modelId: string): number | undefined { + const normalizedPrompt = prompt.trim() + if (!normalizedPrompt) { + return undefined + } + + const matchedDuration = + normalizedPrompt.match(PROMPT_VIDEO_DURATION_EN_PATTERN)?.groups?.duration || + normalizedPrompt.match(PROMPT_VIDEO_DURATION_ZH_PATTERN)?.groups?.duration + + if (!matchedDuration) { + return undefined + } + + const parsed = Number.parseInt(matchedDuration, 10) + if (!Number.isFinite(parsed) || parsed <= 0) { + return undefined + } + + return supportsPromptDerivedVideoDuration(modelId, parsed) ? 
parsed : undefined +} + +function resolveVideoGenerationRequestOptions( + prompt: string, + modelId: string, + options: VideoGenerationOptions | undefined +): VideoGenerationOptions | undefined { + const normalizedOptions = normalizeVideoGenerationOptions(options) + + if ( + typeof normalizedOptions?.duration === 'number' || + (typeof normalizedOptions?.seconds === 'string' && normalizedOptions.seconds.trim().length > 0) + ) { + return normalizedOptions + } + + const promptDuration = resolvePromptVideoDuration(prompt, modelId) + if (promptDuration === undefined) { + return normalizedOptions + } + + return normalizeVideoGenerationOptions({ + ...normalizedOptions, + duration: promptDuration + }) +} + function extractImagePrompt(messages: ChatMessage[]): string { return messages .map((message) => (message.role === 'user' ? normalizePromptValue(message.content) : '')) @@ -134,6 +249,10 @@ function extractImagePrompt(messages: ChatMessage[]): string { .join('\n\n') } +function extractVideoPrompt(messages: ChatMessage[]): string { + return extractImagePrompt(messages) +} + function resolveSupportsNativeTools( context: AiSdkRuntimeContext, modelId: string, @@ -158,6 +277,357 @@ function shouldUseImageGenerationRuntime( return modelConfig.apiEndpoint === ApiEndpointType.Image } +function shouldUseVideoGenerationRuntime( + context: AiSdkRuntimeContext, + modelId: string, + modelConfig: ModelConfig +): boolean { + if (context.shouldUseVideoGeneration) { + return context.shouldUseVideoGeneration(modelId, modelConfig) + } + + return ( + modelConfig.apiEndpoint === ApiEndpointType.Video || + isVideoGenerationModelConfig(modelConfig, modelId) + ) +} + +function shouldUseTtsRuntime( + context: AiSdkRuntimeContext, + modelId: string, + modelConfig: ModelConfig +): boolean { + if (context.shouldUseTts) { + return context.shouldUseTts(modelId, modelConfig) + } + + return ( + modelConfig.apiEndpoint === ApiEndpointType.AudioSpeech || + isTtsModelConfig(modelConfig) || + 
isTtsModelId(modelId) + ) +} + +function buildGeminiTtsPrompt(text: string, instructions?: string): string { + if (instructions?.trim()) { + return `${instructions.trim()}\n\n${text}`.trim() + } + + return text.trim() +} + +function resolveGeminiTtsBaseUrl(provider: LLM_PROVIDER): string { + const rawBaseUrl = (provider.baseUrl || '').trim() + + if (provider.apiType === 'gemini' || provider.id === 'gemini') { + return normalizeGeminiBaseUrl(rawBaseUrl || undefined) + } + + if (rawBaseUrl) { + try { + const parsed = new URL(rawBaseUrl.includes('://') ? rawBaseUrl : `https://${rawBaseUrl}`) + if (provider.id === 'aihubmix' || /(^|\.)aihubmix\.com$/i.test(parsed.hostname)) { + return normalizeGeminiBaseUrl(`${parsed.origin}/gemini`) + } + } catch { + // Fall through to provider-specific fallback below. + } + } + + if (provider.id === 'aihubmix') { + return normalizeGeminiBaseUrl('https://aihubmix.com/gemini') + } + + return normalizeGeminiBaseUrl(rawBaseUrl || undefined) +} + +function normalizeGeminiTtsResponseAudio( + base64: string, + mimeType: string | undefined +): { base64: string; mimeType: string } { + const normalizedMimeType = (mimeType || '').trim() + const lowerMimeType = normalizedMimeType.toLowerCase() + + if (!lowerMimeType || !(lowerMimeType.includes('l16') || lowerMimeType.includes('audio/pcm'))) { + return { + base64, + mimeType: normalizedMimeType || 'audio/wav' + } + } + + const sampleRate = Number(/(?:rate|samplerate)=(\d+)/i.exec(normalizedMimeType)?.[1]) + const bitsPerSample = Number(/(?:bits|bitspersample)=(\d+)/i.exec(normalizedMimeType)?.[1]) + const pcmBuffer = Buffer.from(base64, 'base64') + const resolvedSampleRate = + Number.isFinite(sampleRate) && sampleRate > 0 ? sampleRate : DEFAULT_GEMINI_PCM_SAMPLE_RATE + const resolvedBitsPerSample = + Number.isFinite(bitsPerSample) && bitsPerSample > 0 + ? 
bitsPerSample + : DEFAULT_GEMINI_PCM_BITS_PER_SAMPLE + const blockAlign = resolvedBitsPerSample / 8 + const byteRate = resolvedSampleRate * blockAlign + const wavBuffer = Buffer.alloc(44 + pcmBuffer.length) + + wavBuffer.write('RIFF', 0) + wavBuffer.writeUInt32LE(36 + pcmBuffer.length, 4) + wavBuffer.write('WAVE', 8) + wavBuffer.write('fmt ', 12) + wavBuffer.writeUInt32LE(16, 16) + wavBuffer.writeUInt16LE(1, 20) + wavBuffer.writeUInt16LE(1, 22) + wavBuffer.writeUInt32LE(resolvedSampleRate, 24) + wavBuffer.writeUInt32LE(byteRate, 28) + wavBuffer.writeUInt16LE(blockAlign, 32) + wavBuffer.writeUInt16LE(resolvedBitsPerSample, 34) + wavBuffer.write('data', 36) + wavBuffer.writeUInt32LE(pcmBuffer.length, 40) + pcmBuffer.copy(wavBuffer, 44) + + return { + base64: wavBuffer.toString('base64'), + mimeType: 'audio/wav' + } +} + +/** + * Extracts the text to be synthesized from the last user message in the conversation. + */ +function extractTtsText(messages: ChatMessage[]): string { + for (let i = messages.length - 1; i >= 0; i--) { + const msg = messages[i] + if (msg.role === 'user') { + const text = normalizePromptValue(msg.content) + if (text.trim()) return text.trim() + } + } + return '' +} + +/** + * Pattern A: calls the standard OpenAI-compatible /audio/speech endpoint. + */ +async function executeTtsPatternA( + provider: LLM_PROVIDER, + defaultHeaders: Record, + text: string, + modelId: string, + modelConfig: ModelConfig, + timeout: number | undefined +): Promise<{ base64: string; mimeType: string }> { + const tts = normalizeTtsSettings(modelConfig.tts) + const format = tts?.responseFormat ?? 'mp3' + const baseUrl = (provider.baseUrl || '').replace(/\/+$/, '').replace(/\/v1$/i, '') + const url = `${baseUrl}/v1/audio/speech` + + const body: Record = { + model: modelId, + input: text, + voice: tts?.voice ?? 
'alloy', + response_format: format + } + if (tts?.speed !== undefined) { + body.speed = tts.speed + } + if (tts?.instructions) { + body.instructions = tts.instructions + } + + const controller = new AbortController() + const timeoutId = timeout ? setTimeout(() => controller.abort(), timeout) : undefined + const proxyUrl = proxyConfig.getProxyUrl() + const dispatcher = proxyUrl ? new ProxyAgent(proxyUrl) : undefined + + try { + const fetchInit: RequestInit & { dispatcher?: ProxyAgent } = { + method: 'POST', + headers: { + ...defaultHeaders, + 'Content-Type': 'application/json', + Authorization: `Bearer ${provider.oauthToken || provider.apiKey || ''}` + }, + body: JSON.stringify(body), + signal: controller.signal + } + if (dispatcher) fetchInit.dispatcher = dispatcher + const response = await fetch(url, fetchInit) + + if (!response.ok) { + const errText = await response.text().catch(() => '') + throw new Error(`TTS request failed (${response.status}): ${errText}`) + } + + const buffer = await response.arrayBuffer() + const base64 = Buffer.from(buffer).toString('base64') + return { base64, mimeType: ttsFormatToMimeType(format) } + } finally { + if (timeoutId !== undefined) clearTimeout(timeoutId) + } +} + +/** + * Pattern B: calls the chat completions endpoint with audio output + * (e.g. xiaomimimo mimo-v2.5-tts series). + */ +async function executeTtsPatternB( + provider: LLM_PROVIDER, + defaultHeaders: Record, + text: string, + modelId: string, + modelConfig: ModelConfig, + timeout: number | undefined +): Promise<{ base64: string; mimeType: string }> { + const tts = normalizeTtsSettings(modelConfig.tts) + const format = tts?.responseFormat ?? 
'wav' + const baseUrl = (provider.baseUrl || '').replace(/\/+$/, '').replace(/\/v1$/i, '') + const url = `${baseUrl}/v1/chat/completions` + + const body: Record = { + model: modelId, + messages: [ + { role: 'user', content: text }, + { role: 'assistant', content: text } + ], + modalities: ['text', 'audio'], + audio: { + format, + ...(tts?.voice ? { voice: tts.voice } : {}) + } + } + + const controller = new AbortController() + const timeoutId = timeout ? setTimeout(() => controller.abort(), timeout) : undefined + const proxyUrl = proxyConfig.getProxyUrl() + const dispatcher = proxyUrl ? new ProxyAgent(proxyUrl) : undefined + + try { + const fetchInit: RequestInit & { dispatcher?: ProxyAgent } = { + method: 'POST', + headers: { + ...defaultHeaders, + 'Content-Type': 'application/json', + Authorization: `Bearer ${provider.oauthToken || provider.apiKey || ''}` + }, + body: JSON.stringify(body), + signal: controller.signal + } + if (dispatcher) fetchInit.dispatcher = dispatcher + const response = await fetch(url, fetchInit) + + if (!response.ok) { + const errText = await response.text().catch(() => '') + throw new Error(`TTS (chat audio) request failed (${response.status}): ${errText}`) + } + + const json = (await response.json()) as { + choices?: Array<{ + message?: { + audio?: { data?: string } + content?: Array<{ type?: string; audio?: { data?: string } }> + } + }> + } + const firstMessage = json.choices?.[0]?.message + const audioData = + firstMessage?.audio?.data ?? 
+ firstMessage?.content?.find((item) => item?.type === 'audio')?.audio?.data + if (!audioData) { + throw new Error('TTS response missing audio data in choices[0].message.audio.data') + } + + return { base64: audioData, mimeType: ttsFormatToMimeType(format) } + } finally { + if (timeoutId !== undefined) clearTimeout(timeoutId) + } +} + +async function executeTtsPatternC( + provider: LLM_PROVIDER, + defaultHeaders: Record, + text: string, + modelId: string, + modelConfig: ModelConfig, + timeout: number | undefined +): Promise<{ base64: string; mimeType: string }> { + const tts = normalizeTtsSettings(modelConfig.tts) + const baseUrl = resolveGeminiTtsBaseUrl(provider) + const requestModelId = modelId.trim().split('/').at(-1) || modelId + const url = `${baseUrl}/models/${encodeURIComponent(requestModelId)}:generateContent` + const body: Record = { + contents: [ + { + role: 'user', + parts: [ + { + text: buildGeminiTtsPrompt(text, tts?.instructions) + } + ] + } + ], + generationConfig: { + responseModalities: ['AUDIO'], + speechConfig: { + voiceConfig: { + prebuiltVoiceConfig: { + voiceName: tts?.voice ?? DEFAULT_GEMINI_TTS_VOICE + } + } + } + } + } + + const controller = new AbortController() + const timeoutId = timeout ? setTimeout(() => controller.abort(), timeout) : undefined + const proxyUrl = proxyConfig.getProxyUrl() + const dispatcher = proxyUrl ? 
new ProxyAgent(proxyUrl) : undefined + + try { + const fetchInit: RequestInit & { dispatcher?: ProxyAgent } = { + method: 'POST', + headers: { + ...defaultHeaders, + 'Content-Type': 'application/json', + 'x-goog-api-key': provider.oauthToken || provider.apiKey || '' + }, + body: JSON.stringify(body), + signal: controller.signal + } + if (dispatcher) fetchInit.dispatcher = dispatcher + const response = await fetch(url, fetchInit) + + if (!response.ok) { + const errText = await response.text().catch(() => '') + throw new Error(`TTS (gemini) request failed (${response.status}): ${errText}`) + } + + const json = (await response.json()) as { + candidates?: Array<{ + content?: { + parts?: Array<{ + inlineData?: { data?: string; mimeType?: string } + inline_data?: { data?: string; mime_type?: string } + }> + } + }> + } + const firstPart = json.candidates?.[0]?.content?.parts?.find( + (part) => part.inlineData?.data || part.inline_data?.data + ) + const inlineData = firstPart?.inlineData + const legacyInlineData = firstPart?.inline_data + const audioData = inlineData?.data ?? legacyInlineData?.data + if (!audioData) { + throw new Error('TTS response missing inline audio data in candidates[0].content.parts') + } + + return normalizeGeminiTtsResponseAudio( + audioData, + inlineData?.mimeType ?? legacyInlineData?.mime_type + ) + } finally { + if (timeoutId !== undefined) clearTimeout(timeoutId) + } +} + function resolveRequestTimeout(modelConfig: ModelConfig): number | undefined { const timeout = modelConfig.timeout if (typeof timeout !== 'number' || !Number.isFinite(timeout) || timeout <= 0) { @@ -271,6 +741,355 @@ function resolveRuntimeTemperature( } } +function normalizeOpenAICompatibleBaseUrl(baseUrl: string | undefined): string { + const normalized = (baseUrl || 'https://api.openai.com/v1').trim().replace(/\/+$/, '') + if (!normalized) { + return 'https://api.openai.com/v1' + } + + return /\/v1(?:beta\d+)?$/i.test(normalized) ? 
normalized : `${normalized}/v1` +} + +function normalizeVideoReferenceDataUrl(reference: VideoGenerationReference): string | undefined { + if (reference.url?.trim()) { + return reference.url.trim() + } + + if (!reference.data?.trim()) { + return undefined + } + + const normalizedData = reference.data.trim() + if (normalizedData.startsWith('data:')) { + return normalizedData + } + + const fallbackMimeType = + reference.mimeType?.trim() || + (reference.type === 'image' + ? 'image/png' + : reference.type === 'audio' + ? 'audio/mpeg' + : 'video/mp4') + + return `data:${fallbackMimeType};base64,${normalizedData}` +} + +function buildVideoGenerationContent( + options: VideoGenerationOptions | undefined +): Array> | undefined { + if (!options) { + return undefined + } + + const content: Record[] = [] + + for (const reference of options.references ?? []) { + const url = normalizeVideoReferenceDataUrl(reference) + if (!url) { + continue + } + + if (reference.type === 'image') { + content.push({ + type: 'image_url', + image_url: { url }, + role: 'reference_image' + }) + continue + } + + if (reference.type === 'audio') { + content.push({ + type: 'audio_url', + audio_url: { url }, + role: 'reference_audio' + }) + continue + } + + content.push({ + type: 'video_url', + video_url: { url }, + role: 'reference_video' + }) + } + + return content.length > 0 ? 
content : undefined +} + +function buildVideoGenerationExtraBody( + options: VideoGenerationOptions | undefined +): Record | undefined { + if (!options) { + return undefined + } + + const extraBody: Record = {} + + if (typeof options.duration === 'number' && Number.isFinite(options.duration)) { + extraBody.duration = options.duration + } + if (typeof options.ratio === 'string' && options.ratio.trim()) { + extraBody.ratio = options.ratio.trim() + } + if (typeof options.resolution === 'string' && options.resolution.trim()) { + extraBody.resolution = options.resolution.trim() + } + if (typeof options.watermark === 'boolean') { + extraBody.watermark = options.watermark + } + if (typeof options.generateAudio === 'boolean') { + extraBody.generate_audio = options.generateAudio + } + + const content = buildVideoGenerationContent(options) + if (content) { + extraBody.content = content + } + + return Object.keys(extraBody).length > 0 ? extraBody : undefined +} + +function resolveFlatTopLevelVideoDuration( + options: VideoGenerationOptions | undefined +): number | undefined { + if (typeof options?.duration === 'number' && Number.isFinite(options.duration)) { + return Math.max(-1, Math.round(options.duration)) + } + + if (typeof options?.seconds !== 'string') { + return undefined + } + + const parsed = Number.parseInt(options.seconds.trim(), 10) + return Number.isFinite(parsed) ? 
Math.max(-1, parsed) : undefined +} + +function buildVideoGenerationRequestBody( + provider: LLM_PROVIDER, + modelId: string, + prompt: string, + options: VideoGenerationOptions | undefined +): VideoGenerationRequestBody { + const body: VideoGenerationRequestBody = { + model: modelId, + prompt + } + + if (options?.seconds) { + body.seconds = options.seconds + } + if (options?.size) { + body.size = options.size + } + if (options?.inputReference) { + if (typeof options.inputReference === 'string') { + body.input_reference = options.inputReference + } else { + body.input_reference = { + data: options.inputReference.data, + ...(options.inputReference.mimeType ? { mime_type: options.inputReference.mimeType } : {}) + } + } + } + + const requestBodyShape = resolveOpenAICompatibleVideoRequestBodyShape({ + providerId: provider.id, + providerApiType: provider.apiType, + baseUrl: provider.baseUrl, + modelId + }) + + if (requestBodyShape === 'flat-top-level') { + const content = buildVideoGenerationContent(options) + if (content) { + body.content = content + } + if (options?.ratio) { + body.ratio = options.ratio.trim() + } + const duration = resolveFlatTopLevelVideoDuration(options) + if (duration !== undefined) { + body.duration = duration + } + if (options?.resolution) { + body.resolution = options.resolution.trim() + } + if (typeof options?.watermark === 'boolean') { + body.watermark = options.watermark + } + if (typeof options?.generateAudio === 'boolean') { + body.generate_audio = options.generateAudio + } + + return body + } + + const extraBody = buildVideoGenerationExtraBody(options) + if (extraBody) { + body.extra_body = extraBody + } + + return body +} + +function extractVideoTaskError(response: VideoGenerationTaskResponse | null | undefined): string { + const error = response?.error + if (typeof error === 'string' && error.trim()) { + return error.trim() + } + + if ( + error && + typeof error === 'object' && + typeof error.message === 'string' && + 
error.message.trim() + ) { + return error.message.trim() + } + + return 'Video generation failed' +} + +function resolveVideoTaskStatus(response: VideoGenerationTaskResponse | null | undefined): string { + return typeof response?.status === 'string' ? response.status.trim().toLowerCase() : '' +} + +function delayWithAbort(ms: number, signal: AbortSignal): Promise { + return new Promise((resolve, reject) => { + if (signal.aborted) { + reject(signal.reason instanceof Error ? signal.reason : new Error('Aborted')) + return + } + + const onAbort = () => { + clearTimeout(timeoutId) + signal.removeEventListener('abort', onAbort) + reject(signal.reason instanceof Error ? signal.reason : new Error('Aborted')) + } + + const timeoutId = setTimeout(() => { + signal.removeEventListener('abort', onAbort) + resolve() + }, ms) + + signal.addEventListener('abort', onAbort, { once: true }) + }) +} + +async function executeOpenAICompatibleVideoGeneration( + provider: LLM_PROVIDER, + defaultHeaders: Record, + modelId: string, + prompt: string, + modelConfig: ModelConfig, + timeout: number | undefined +): Promise<{ base64: string; mimeType: string }> { + const normalizedOptions = resolveVideoGenerationRequestOptions( + prompt, + modelId, + modelConfig.videoGeneration + ) + const baseUrl = normalizeOpenAICompatibleBaseUrl(provider.baseUrl) + const createUrl = `${baseUrl}/videos` + const body = buildVideoGenerationRequestBody(provider, modelId, prompt, normalizedOptions) + const controller = new AbortController() + const timeoutId = timeout ? setTimeout(() => controller.abort(), timeout) : undefined + const proxyUrl = proxyConfig.getProxyUrl() + const dispatcher = proxyUrl ? 
new ProxyAgent(proxyUrl) : undefined + + const fetchJson = async (url: string, init: RequestInit): Promise => { + const fetchInit: RequestInit & { dispatcher?: ProxyAgent } = { + ...init, + headers: { + ...defaultHeaders, + Authorization: `Bearer ${provider.oauthToken || provider.apiKey || ''}`, + ...(init.headers as Record | undefined) + }, + signal: controller.signal + } + if (dispatcher) fetchInit.dispatcher = dispatcher + + const response = await fetch(url, fetchInit) + if (!response.ok) { + const errorText = await response.text().catch(() => '') + throw new Error(`Video request failed (${response.status}): ${errorText}`) + } + + return (await response.json()) as T + } + + const fetchBinary = async (url: string): Promise<{ buffer: ArrayBuffer; mimeType: string }> => { + const fetchInit: RequestInit & { dispatcher?: ProxyAgent } = { + method: 'GET', + headers: { + ...defaultHeaders, + Authorization: `Bearer ${provider.oauthToken || provider.apiKey || ''}` + }, + signal: controller.signal + } + if (dispatcher) fetchInit.dispatcher = dispatcher + + const response = await fetch(url, fetchInit) + if (!response.ok) { + const errorText = await response.text().catch(() => '') + throw new Error(`Video content download failed (${response.status}): ${errorText}`) + } + + return { + buffer: await response.arrayBuffer(), + mimeType: response.headers.get('content-type')?.split(';')[0]?.trim() || 'video/mp4' + } + } + + try { + let task = await fetchJson(createUrl, { + method: 'POST', + headers: { + 'Content-Type': 'application/json' + }, + body: JSON.stringify(body) + }) + + const taskId = typeof task.id === 'string' ? 
task.id.trim() : '' + if (!taskId) { + throw new Error('Video generation response missing task id') + } + + let status = resolveVideoTaskStatus(task) + while (status !== 'completed') { + if (status === 'failed') { + throw new Error(extractVideoTaskError(task)) + } + + await delayWithAbort(VIDEO_GENERATION_POLL_INTERVAL_MS, controller.signal) + task = await fetchJson( + `${createUrl}/${encodeURIComponent(taskId)}`, + { + method: 'GET' + } + ) + status = resolveVideoTaskStatus(task) + } + + const contentUrl = + typeof task.url === 'string' && task.url.trim().length > 0 + ? task.url.trim() + : `${createUrl}/${encodeURIComponent(taskId)}/content` + const { buffer, mimeType } = await fetchBinary(contentUrl) + + return { + base64: Buffer.from(buffer).toString('base64'), + mimeType + } + } finally { + if (timeoutId !== undefined) { + clearTimeout(timeoutId) + } + } +} + async function buildPromptRuntime( context: AiSdkRuntimeContext, messages: ChatMessage[], @@ -398,6 +1217,97 @@ export async function* runAiSdkCoreStream( const normalizedModelConfig = normalizeRuntimeModelConfig(context, modelId, modelConfig) const timeout = resolveRequestTimeout(normalizedModelConfig) + if (shouldUseTtsRuntime(context, modelId, normalizedModelConfig)) { + const text = extractTtsText(messages) + const usePatternB = isChatAudioTtsModel(modelId) + const usePatternC = isGeminiGenerateContentTtsModel(modelId) + + const { base64, mimeType } = usePatternC + ? await executeTtsPatternC( + context.provider, + context.defaultHeaders, + text, + modelId, + normalizedModelConfig, + timeout + ) + : usePatternB + ? 
await executeTtsPatternB( + context.provider, + context.defaultHeaders, + text, + modelId, + normalizedModelConfig, + timeout + ) + : await executeTtsPatternA( + context.provider, + context.defaultHeaders, + text, + modelId, + normalizedModelConfig, + timeout + ) + + const dataUrl = `data:${mimeType};base64,${base64}` + const cachedAudio = await presenter.devicePresenter.cacheImage(dataUrl) + yield { + type: 'image_data', + image_data: { + data: cachedAudio, + mimeType + } + } + yield { + type: 'stop', + stop_reason: 'complete' + } + return + } + + if (shouldUseVideoGenerationRuntime(context, modelId, normalizedModelConfig)) { + const prompt = extractVideoPrompt(messages) + const normalizedVideoOptions = resolveVideoGenerationRequestOptions( + prompt, + modelId, + normalizedModelConfig.videoGeneration + ) + const requestBody = buildVideoGenerationRequestBody( + context.provider, + modelId, + prompt, + normalizedVideoOptions + ) + + await context.emitRequestTrace?.(normalizedModelConfig, { + endpoint: `${normalizeOpenAICompatibleBaseUrl(context.provider.baseUrl)}/videos`, + headers: context.buildTraceHeaders?.() ?? 
context.defaultHeaders, + body: requestBody + }) + + const { base64, mimeType } = await executeOpenAICompatibleVideoGeneration( + context.provider, + context.defaultHeaders, + modelId, + prompt, + normalizedModelConfig, + timeout + ) + + yield { + type: 'image_data', + image_data: { + data: `data:${mimeType};base64,${base64}`, + mimeType + } + } + yield { + type: 'stop', + stop_reason: 'complete' + } + return + } + if (shouldUseImageGenerationRuntime(context, modelId, normalizedModelConfig)) { const prompt = extractImagePrompt(messages) diff --git a/src/main/presenter/llmProviderPresenter/index.ts b/src/main/presenter/llmProviderPresenter/index.ts index a1c100a2c..b7bab7c04 100644 --- a/src/main/presenter/llmProviderPresenter/index.ts +++ b/src/main/presenter/llmProviderPresenter/index.ts @@ -9,6 +9,7 @@ import { KeyStatus, LLM_EMBEDDING_ATTRS, StandaloneImageGenerationResult, + StandaloneVideoGenerationResult, ModelScopeMcpSyncOptions, ModelScopeMcpSyncResult, IConfigPresenter, @@ -24,6 +25,10 @@ import { normalizeImageGenerationOptions, type ImageGenerationOptions } from '@shared/imageGenerationSettings' +import { + normalizeVideoGenerationOptions, + type VideoGenerationOptions +} from '@shared/videoGenerationSettings' import { ProviderChange, ProviderBatchUpdate } from '@shared/provider-operations' import { isProviderDbBackedProvider } from '@shared/providerDbCatalog' import { eventBus } from '@/eventbus' @@ -538,6 +543,89 @@ export class LLMProviderPresenter implements ILlmProviderPresenter { } } + async generateVideoStandalone( + providerId: string, + prompt: string, + modelId: string, + videoOptions?: VideoGenerationOptions, + options?: { signal?: AbortSignal } + ): Promise { + const normalizedPrompt = prompt.trim() + if (!normalizedPrompt) { + throw new Error('Video generation prompt is required') + } + + const signal = options?.signal + if (signal?.aborted) { + throw createAbortError() + } + + await this.executeWithRateLimit(providerId, { signal }) + + 
const provider = this.getProviderInstance(providerId) + const modelConfig = this.configPresenter.getModelConfig(modelId, providerId) + const mergedVideoOptions = normalizeVideoGenerationOptions({ + ...modelConfig.videoGeneration, + ...videoOptions + }) + const resolvedModelConfig: ModelConfig = { + ...modelConfig, + type: ModelType.VideoGeneration, + apiEndpoint: ApiEndpointType.Video, + videoGeneration: mergedVideoOptions + } + const stream = provider.coreStream( + [{ role: 'user', content: normalizedPrompt }], + modelId, + resolvedModelConfig, + modelConfig.temperature ?? 0.7, + modelConfig.maxTokens ?? 1024, + [] + ) + const videos: StandaloneVideoGenerationResult['videos'] = [] + const abort = createAbortPromise(signal, () => { + void stream.return?.(undefined as never) + }) + + const collect = async () => { + for await (const event of stream) { + if (signal?.aborted) { + throw createAbortError() + } + + if ( + event.type === 'image_data' && + event.image_data.mimeType.trim().toLowerCase().startsWith('video/') + ) { + videos.push({ + data: event.image_data.data, + mimeType: event.image_data.mimeType + }) + } + if (event.type === 'error') { + throw new Error(event.error_message) + } + } + } + + try { + await (abort.promise ? Promise.race([collect(), abort.promise]) : collect()) + } finally { + abort.cleanup() + } + + if (videos.length === 0) { + throw new Error('Video generation completed without video output') + } + + return { + providerId, + modelId, + ...(mergedVideoOptions ? 
{ options: mergedVideoOptions } : {}), + videos + } + } + // 配置相关方法 setMaxConcurrentStreams(max: number): void { this.config.maxConcurrentStreams = max diff --git a/src/main/presenter/llmProviderPresenter/providers/aiSdkProvider.ts b/src/main/presenter/llmProviderPresenter/providers/aiSdkProvider.ts index 8c87ba909..37efbd9a9 100644 --- a/src/main/presenter/llmProviderPresenter/providers/aiSdkProvider.ts +++ b/src/main/presenter/llmProviderPresenter/providers/aiSdkProvider.ts @@ -7,6 +7,8 @@ import { resolveProviderCapabilityProviderId, type NewApiEndpointType } from '@shared/model' +import { isTtsModelConfig, isTtsModelId } from '@shared/ttsSettings' +import { isVideoGenerationModelConfig } from '@shared/videoGenerationSettings' import { DEFAULT_MODEL_CONTEXT_LENGTH, DEFAULT_MODEL_MAX_TOKENS, @@ -95,6 +97,15 @@ const shouldUseOpenAIImageGenerationRoute = (modelId: string, modelConfig: Model modelConfig.apiEndpoint === ApiEndpointType.Image || modelConfig.type === ModelType.ImageGeneration +const shouldUseOpenAIVideoGenerationRoute = (modelId: string, modelConfig: ModelConfig): boolean => + modelConfig.apiEndpoint === ApiEndpointType.Video || + isVideoGenerationModelConfig(modelConfig, modelId) + +const shouldUseOpenAITtsRoute = (modelId: string, modelConfig: ModelConfig): boolean => + isTtsModelConfig(modelConfig) || + modelConfig.apiEndpoint === ApiEndpointType.AudioSpeech || + isTtsModelId(modelId) + export function normalizeExtractedImageText(content: string): string { const normalized = content .replace(/\r\n/g, '\n') @@ -345,6 +356,27 @@ export class AiSdkProvider extends BaseLLMProvider { endpointType: 'image-generation' } } + case 'video-generation': + return { + providerKind: 'openai-compatible', + endpointType, + providerPatch: { + apiType: 'openai-completions', + baseUrl: `${host}/v1`, + capabilityProviderId: resolveProviderCapabilityProviderId( + this.provider.id, + { + endpointType + }, + modelId + ) + }, + modelConfigPatch: { + apiEndpoint: 
ApiEndpointType.Video, + type: ModelType.VideoGeneration, + endpointType: 'video-generation' + } + } case 'openai': default: return { @@ -569,6 +601,27 @@ export class AiSdkProvider extends BaseLLMProvider { isOpenAIImageGenerationModel(runtimeModelId) || runtimeModelConfig.apiEndpoint === ApiEndpointType.Image + const shouldUseVideoGeneration = + this.isAzureOpenAI(decision, runtimeProvider) || + decision.providerKind === 'gemini' || + decision.providerKind === 'vertex' || + decision.providerKind === 'anthropic' + ? undefined + : decision.endpointType === 'video-generation' + ? () => true + : (runtimeModelId: string, runtimeModelConfig: ModelConfig) => + shouldUseOpenAIVideoGenerationRoute(runtimeModelId, runtimeModelConfig) + + // TTS route: only applicable for OpenAI-compatible providers (not Azure, Gemini, Vertex) + const shouldUseTts = + this.isAzureOpenAI(decision, runtimeProvider) || + decision.providerKind === 'gemini' || + decision.providerKind === 'vertex' || + decision.providerKind === 'anthropic' + ? undefined + : (runtimeModelId: string, runtimeModelConfig: ModelConfig) => + shouldUseOpenAITtsRoute(runtimeModelId, runtimeModelConfig) + return { decision, resolvedModelConfig, @@ -585,7 +638,9 @@ export class AiSdkProvider extends BaseLLMProvider { cleanHeaders, supportsNativeTools: (_runtimeModelId, runtimeModelConfig) => runtimeModelConfig.functionCall === true, - shouldUseImageGeneration + shouldUseImageGeneration, + shouldUseVideoGeneration, + shouldUseTts } } } @@ -1656,13 +1711,22 @@ export class AiSdkProvider extends BaseLLMProvider { normalizedRawType === 'image' || supportedEndpointTypes.includes('image-generation') ? ModelType.ImageGeneration - : normalizedRawType === 'embedding' || - normalizedRawType === 'embeddings' || - normalizedModelId.includes('embedding') - ? ModelType.Embedding - : normalizedRawType === 'rerank' || normalizedModelId.includes('rerank') - ? 
ModelType.Rerank - : undefined + : normalizedRawType === 'videogeneration' || + normalizedRawType === 'video-generation' || + normalizedRawType === 'video' || + supportedEndpointTypes.includes('video-generation') + ? ModelType.VideoGeneration + : normalizedRawType === 'tts' || + normalizedRawType === 'audio-speech' || + normalizedRawType === 'audiospeech' + ? ModelType.TTS + : normalizedRawType === 'embedding' || + normalizedRawType === 'embeddings' || + normalizedModelId.includes('embedding') + ? ModelType.Embedding + : normalizedRawType === 'rerank' || normalizedModelId.includes('rerank') + ? ModelType.Rerank + : undefined const contextLengthCandidate = [ rawModel.context_length, @@ -1687,7 +1751,9 @@ export class AiSdkProvider extends BaseLLMProvider { supportedEndpointTypes.length === 0 ? type === ModelType.ImageGeneration ? 'image-generation' - : undefined + : type === ModelType.VideoGeneration + ? 'video-generation' + : undefined : resolveNewApiEndpointTypeFromRoute( { supportedEndpointTypes, @@ -1725,7 +1791,11 @@ export class AiSdkProvider extends BaseLLMProvider { ...existingConfig, type: model.type ?? existingConfig.type, apiEndpoint: - model.endpointType === 'image-generation' ? ApiEndpointType.Image : ApiEndpointType.Chat, + model.endpointType === 'image-generation' + ? ApiEndpointType.Image + : model.type === ModelType.TTS + ? ApiEndpointType.AudioSpeech + : ApiEndpointType.Chat, endpointType: model.endpointType ?? 
existingConfig.endpointType }) } diff --git a/src/main/presenter/sqlitePresenter/tables/deepchatSessions.ts b/src/main/presenter/sqlitePresenter/tables/deepchatSessions.ts index 779dfa71f..7993f9742 100644 --- a/src/main/presenter/sqlitePresenter/tables/deepchatSessions.ts +++ b/src/main/presenter/sqlitePresenter/tables/deepchatSessions.ts @@ -12,6 +12,10 @@ import { normalizeImageGenerationOptions, type ImageGenerationOptions } from '@shared/imageGenerationSettings' +import { + normalizeVideoGenerationOptions, + type VideoGenerationOptions +} from '@shared/videoGenerationSettings' type DeepChatSessionGenerationSettings = Pick< SessionGenerationSettings, @@ -26,6 +30,7 @@ type DeepChatSessionGenerationSettings = Pick< | 'verbosity' | 'forceInterleavedThinkingCompat' | 'imageGeneration' + | 'videoGeneration' > export interface DeepChatSessionRow { @@ -44,6 +49,7 @@ export interface DeepChatSessionRow { verbosity: 'low' | 'medium' | 'high' | null force_interleaved_thinking_compat: number | null image_generation_options_json: string | null + video_generation_options_json: string | null summary_text: string | null summary_cursor_order_seq: number | null summary_updated_at: number | null @@ -109,6 +115,10 @@ export class DeepChatSessionsTable extends BaseTable { columns.push('image_generation_options_json TEXT') } + if (version >= 28) { + columns.push('video_generation_options_json TEXT') + } + if (version >= 14) { columns.push( 'summary_text TEXT', @@ -187,6 +197,11 @@ export class DeepChatSessionsTable extends BaseTable { 'ALTER TABLE deepchat_sessions ADD COLUMN image_generation_options_json TEXT;' ) } + if (!this.hasColumn('video_generation_options_json')) { + statements.push( + 'ALTER TABLE deepchat_sessions ADD COLUMN video_generation_options_json TEXT;' + ) + } return statements } @@ -230,11 +245,14 @@ export class DeepChatSessionsTable extends BaseTable { if (version === 27) { return 'ALTER TABLE deepchat_sessions ADD COLUMN image_generation_options_json TEXT;' 
} + if (version === 28) { + return 'ALTER TABLE deepchat_sessions ADD COLUMN video_generation_options_json TEXT;' + } return null } getLatestVersion(): number { - return 27 + return 28 } private serializeImageGenerationOptions( @@ -257,6 +275,26 @@ export class DeepChatSessionsTable extends BaseTable { } } + private serializeVideoGenerationOptions( + value: VideoGenerationOptions | undefined + ): string | null { + const normalized = normalizeVideoGenerationOptions(value) + return normalized ? JSON.stringify(normalized) : null + } + + private parseVideoGenerationOptions(value: string | null): VideoGenerationOptions | undefined { + if (!value) { + return undefined + } + + try { + const parsed = JSON.parse(value) as VideoGenerationOptions + return normalizeVideoGenerationOptions(parsed) + } catch { + return undefined + } + } + create( id: string, providerId: string, @@ -282,11 +320,12 @@ export class DeepChatSessionsTable extends BaseTable { verbosity, force_interleaved_thinking_compat, image_generation_options_json, + video_generation_options_json, summary_text, summary_cursor_order_seq, summary_updated_at ) - VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)` + VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)` ) .run( id, @@ -308,6 +347,7 @@ export class DeepChatSessionsTable extends BaseTable { ? 
1 : 0, this.serializeImageGenerationOptions(generationSettings?.imageGeneration), + this.serializeVideoGenerationOptions(generationSettings?.videoGeneration), null, 1, null @@ -362,6 +402,10 @@ export class DeepChatSessionsTable extends BaseTable { if (imageGeneration) { settings.imageGeneration = imageGeneration } + const videoGeneration = this.parseVideoGenerationOptions(row.video_generation_options_json) + if (videoGeneration) { + settings.videoGeneration = videoGeneration + } return settings } @@ -430,6 +474,10 @@ export class DeepChatSessionsTable extends BaseTable { updates.push('image_generation_options_json = ?') params.push(this.serializeImageGenerationOptions(settings.imageGeneration)) } + if (Object.prototype.hasOwnProperty.call(settings, 'videoGeneration')) { + updates.push('video_generation_options_json = ?') + params.push(this.serializeVideoGenerationOptions(settings.videoGeneration)) + } if (updates.length === 0) { return diff --git a/src/main/presenter/toolPresenter/agentTools/agentPlanTool.ts b/src/main/presenter/toolPresenter/agentTools/agentPlanTool.ts new file mode 100644 index 000000000..a2c4447c0 --- /dev/null +++ b/src/main/presenter/toolPresenter/agentTools/agentPlanTool.ts @@ -0,0 +1,158 @@ +import { z } from 'zod' +import { zodToJsonSchema } from 'zod-to-json-schema' +import type { MCPToolDefinition } from '@shared/presenter' +import type { AgentToolProgressUpdate } from '@shared/types/presenters/tool.presenter' +import type { AgentPlanState, AgentPlanSnapshot, UpdatePlanArgs } from '@shared/types/agent-plan' + +export const UPDATE_PLAN_TOOL_NAME = 'update_plan' +export const AGENT_CORE_TOOL_SERVER_NAME = 'agent-core' + +const MAX_PLAN_ITEMS = 12 + +const planItemSchema = z + .object({ + step: z + .string() + .transform((value) => value.trim()) + .refine((value) => value.length > 0, 'step must be a non-empty string'), + status: z.enum(['pending', 'in_progress', 'completed']) + }) + .strict() + +export const updatePlanToolArgsSchema = z + 
.object({ + explanation: z.string().optional(), + plan: z.array(planItemSchema).max(MAX_PLAN_ITEMS) + }) + .strict() + .superRefine((value, context) => { + const inProgressCount = value.plan.filter((item) => item.status === 'in_progress').length + if (inProgressCount > 1) { + context.addIssue({ + code: z.ZodIssueCode.custom, + path: ['plan'], + message: 'at most one step can be in_progress' + }) + } + }) + +export interface AgentPlanToolCallOptions { + toolCallId?: string + onProgress?: (update: AgentToolProgressUpdate) => void +} + +const formatValidationError = (error: z.ZodError): string => { + const firstIssue = error.issues[0] + if (!firstIssue) { + return 'invalid update_plan arguments' + } + + const path = firstIssue.path.length > 0 ? `${firstIssue.path.join('.')}: ` : '' + return `invalid update_plan arguments: ${path}${firstIssue.message}` +} + +export class AgentPlanTool { + private readonly states = new Map() + + getToolDefinition(): MCPToolDefinition { + return { + type: 'function', + function: { + name: UPDATE_PLAN_TOOL_NAME, + description: + 'Update the visible progress checklist for the current multi-step task. Provide the complete current plan snapshot every time. Use short, concrete, verifiable steps. 
At most one step may be in_progress.', + parameters: zodToJsonSchema(updatePlanToolArgsSchema) as { + type: string + properties: Record + required?: string[] + } + }, + server: { + name: AGENT_CORE_TOOL_SERVER_NAME, + icons: 'list-checks', + description: 'Agent core tools' + } + } + } + + call( + args: Record, + conversationId?: string, + options?: AgentPlanToolCallOptions + ): { content: string; rawData: { content: string; isError: boolean; toolResult: unknown } } { + const sessionId = conversationId?.trim() + if (!sessionId) { + throw new Error('update_plan requires a conversation ID') + } + + const validationResult = updatePlanToolArgsSchema.safeParse(args) + if (!validationResult.success) { + throw new Error(formatValidationError(validationResult.error)) + } + + const normalizedArgs = this.normalizeArgs(validationResult.data) + const previous = this.states.get(sessionId) + const revision = (previous?.revision ?? 0) + 1 + const updatedAt = new Date().toISOString() + const toolCallId = options?.toolCallId?.trim() || undefined + const snapshot: AgentPlanSnapshot = { + sessionId, + ...(toolCallId ? { toolCallId } : {}), + ...(normalizedArgs.explanation ? { explanation: normalizedArgs.explanation } : {}), + plan: normalizedArgs.plan, + revision, + updatedAt + } + + this.states.set(sessionId, { + current: normalizedArgs, + revision, + updatedAt + }) + + if (toolCallId) { + options?.onProgress?.({ + kind: 'agent_plan', + toolCallId, + snapshot + }) + } + + return { + content: '{}', + rawData: { + content: '{}', + isError: false, + toolResult: { + kind: 'agent_plan', + snapshot + } + } + } + } + + getState(conversationId: string): AgentPlanState { + return ( + this.states.get(conversationId) ?? 
{ + current: null, + revision: 0, + updatedAt: null + } + ) + } + + clearState(conversationId: string): void { + this.states.delete(conversationId) + } + + private normalizeArgs(args: z.output): UpdatePlanArgs { + const explanation = args.explanation?.trim() + return { + ...(explanation ? { explanation } : {}), + plan: args.plan.map((item) => ({ + step: item.step, + status: item.status + })) + } + } +} diff --git a/src/main/presenter/toolPresenter/agentTools/agentToolManager.ts b/src/main/presenter/toolPresenter/agentTools/agentToolManager.ts index c20da81e8..c1c239c29 100644 --- a/src/main/presenter/toolPresenter/agentTools/agentToolManager.ts +++ b/src/main/presenter/toolPresenter/agentTools/agentToolManager.ts @@ -28,6 +28,7 @@ import { SubagentOrchestratorTool } from './subagentOrchestratorTool' import { AgentImageGenerationTool, IMAGE_GENERATE_TOOL_NAME } from './agentImageGenerationTool' +import { AgentPlanTool, UPDATE_PLAN_TOOL_NAME } from './agentPlanTool' // Consider moving to a shared handlers location in future refactoring import { @@ -121,6 +122,7 @@ export class AgentToolManager { private chatSettingsHandler: ChatSettingsToolHandler | null = null private subagentOrchestratorTool: SubagentOrchestratorTool | null = null private imageGenerationTool: AgentImageGenerationTool | null = null + private planTool: AgentPlanTool | null = null private static readonly READ_FILE_AUTO_TRUNCATE_THRESHOLD = 4500 private readonly fileSystemSchemas = { @@ -285,6 +287,7 @@ export class AgentToolManager { configPresenter: this.configPresenter, runtimePort: this.runtimePort }) + this.planTool = new AgentPlanTool() if (this.agentWorkspacePath) { this.fileSystemHandler = new AgentFileSystemHandler([this.agentWorkspacePath]) this.bashHandler = new AgentBashHandler( @@ -345,6 +348,11 @@ export class AgentToolManager { // 2. Built-in question tool (all modes) defs.push(...this.getQuestionToolDefinitions()) + // 2.1. 
Progress checklist tool (deepchat regular sessions only) + if (isAgentMode && this.planTool) { + defs.push(this.planTool.getToolDefinition()) + } + // 2.25. Image generation tool (deepchat agent sessions with an image model) if (isAgentMode && this.imageGenerationTool) { try { @@ -430,6 +438,17 @@ export class AgentToolManager { conversationId?: string, options?: AgentToolExecutionOptions ): Promise { + if (toolName === UPDATE_PLAN_TOOL_NAME) { + if (!this.planTool) { + throw new Error('Progress tool is not available.') + } + + return this.planTool.call(args, conversationId, { + toolCallId: options?.toolCallId, + onProgress: options?.onProgress + }) + } + if (toolName === QUESTION_TOOL_NAME) { const validationResult = questionToolSchema.safeParse(args) if (!validationResult.success) { diff --git a/src/main/presenter/toolPresenter/agentTools/index.ts b/src/main/presenter/toolPresenter/agentTools/index.ts index e6a0dff9f..e91f1cfb8 100644 --- a/src/main/presenter/toolPresenter/agentTools/index.ts +++ b/src/main/presenter/toolPresenter/agentTools/index.ts @@ -11,3 +11,4 @@ export { CHAT_SETTINGS_SKILL_NAME, CHAT_SETTINGS_TOOL_NAMES } from './chatSettingsTools' +export { AGENT_CORE_TOOL_SERVER_NAME, UPDATE_PLAN_TOOL_NAME, AgentPlanTool } from './agentPlanTool' diff --git a/src/main/presenter/toolPresenter/index.ts b/src/main/presenter/toolPresenter/index.ts index 6d876919d..e7195bde3 100644 --- a/src/main/presenter/toolPresenter/index.ts +++ b/src/main/presenter/toolPresenter/index.ts @@ -10,7 +10,12 @@ import type { PermissionMode } from '@shared/types/agent-interface' import { resolveToolOffloadTemplatePath } from '@/lib/agentRuntime/sessionPaths' import { QUESTION_TOOL_NAME } from '@/lib/agentRuntime/questionTool' import { ToolMapper, type ToolSource } from './toolMapper' -import { AgentToolManager, IMAGE_GENERATE_TOOL_NAME, type AgentToolCallResult } from './agentTools' +import { + AgentToolManager, + IMAGE_GENERATE_TOOL_NAME, + UPDATE_PLAN_TOOL_NAME, + type 
AgentToolCallResult +} from './agentTools' import type { AgentToolRuntimePort } from './runtimePorts' import { createAgentToolErrorResult, @@ -89,7 +94,8 @@ const FILESYSTEM_TOOL_ORDER = ['read', 'write', 'edit', 'exec', 'process'] const OFFLOAD_TOOL_NAMES = new Set(['exec', 'cdp_send']) const RESERVED_AGENT_TOOL_NAMES = new Set([ ...YO_BROWSER_TOOL_NAMES, - IMAGE_GENERATE_TOOL_NAME + IMAGE_GENERATE_TOOL_NAME, + UPDATE_PLAN_TOOL_NAME ]) const withToolSource = (tools: MCPToolDefinition[], source: 'mcp' | 'agent'): MCPToolDefinition[] => @@ -453,6 +459,7 @@ export class ToolPresenter implements IToolPresenter { this.buildFilesystemPrompt(toolNames, offloadPath), this.buildQuestionPrompt(toolNames), this.buildImageGenerationPrompt(toolNames), + this.buildProgressPrompt(toolNames), this.buildSkillsPrompt(toolNames), this.buildSettingsPrompt(groupedTools.get('deepchat-settings') ?? []), this.buildYoBrowserPrompt(groupedTools.get('yobrowser') ?? []) @@ -606,6 +613,24 @@ export class ToolPresenter implements IToolPresenter { ].join('\n') } + private buildProgressPrompt(toolNames: Set): string { + if (!toolNames.has(UPDATE_PLAN_TOOL_NAME)) { + return '' + } + + return [ + '## Progress Checklist Tool', + `Use \`${UPDATE_PLAN_TOOL_NAME}\` for non-trivial multi-step tasks.`, + 'Skip it for simple one-shot answers or trivial edits.', + 'Each call must provide the complete current checklist snapshot.', + 'Keep each step short, concrete, and verifiable.', + 'Keep the checklist current as work progresses.', + 'At most one step may be in_progress at a time.', + 'When a step completes, update the checklist immediately and move the next active step to in_progress in the same call.', + 'Use explanation only when the plan changes materially or progress would otherwise be unclear.' 
+ ].join('\n') + } + private buildSettingsPrompt(tools: MCPToolDefinition[]): string { if (tools.length === 0) { return '' diff --git a/src/renderer/api/ChatClient.ts b/src/renderer/api/ChatClient.ts index 303cbafb1..d6bb6f54c 100644 --- a/src/renderer/api/ChatClient.ts +++ b/src/renderer/api/ChatClient.ts @@ -1,5 +1,6 @@ import type { DeepchatBridge } from '@shared/contracts/bridge' import { + chatPlanUpdatedEvent, chatStreamCompletedEvent, chatStreamFailedEvent, chatStreamUpdatedEvent, @@ -66,6 +67,10 @@ export function createChatClient(bridge: DeepchatBridge = getDeepchatBridge()) { return bridge.on(chatStreamFailedEvent.name, listener) } + function onPlanUpdated(listener: (payload: DeepchatEventPayload<'chat.plan.updated'>) => void) { + return bridge.on(chatPlanUpdatedEvent.name, listener) + } + return { sendMessage, steerActiveTurn, @@ -73,7 +78,8 @@ export function createChatClient(bridge: DeepchatBridge = getDeepchatBridge()) { respondToolInteraction, onStreamUpdated, onStreamCompleted, - onStreamFailed + onStreamFailed, + onPlanUpdated } } diff --git a/src/renderer/settings/components/DeepChatAgentsSettings.vue b/src/renderer/settings/components/DeepChatAgentsSettings.vue index d282ce06e..9228442b9 100644 --- a/src/renderer/settings/components/DeepChatAgentsSettings.vue +++ b/src/renderer/settings/components/DeepChatAgentsSettings.vue @@ -1301,8 +1301,13 @@ const startCreate = () => { assignForm(emptyForm()) } const resetEditor = () => { - if (selectedAgentId.value === DRAFT_AGENT_ID) startCreate() - else selectAgent(selectedAgentId.value) + const agentId = selectedAgentId.value + if (!agentId || agentId === DRAFT_AGENT_ID) { + startCreate() + return + } + + selectAgent(agentId) } const saveAgent = async () => { if (!form.name.trim()) return diff --git a/src/renderer/settings/components/ProviderModelList.vue b/src/renderer/settings/components/ProviderModelList.vue index 4e0c41a86..2be6bd096 100644 --- a/src/renderer/settings/components/ProviderModelList.vue 
+++ b/src/renderer/settings/components/ProviderModelList.vue @@ -376,7 +376,9 @@ const TYPE_ORDER: ModelType[] = [ ModelType.Chat, ModelType.Embedding, ModelType.Rerank, - ModelType.ImageGeneration + ModelType.ImageGeneration, + ModelType.VideoGeneration, + ModelType.TTS ] const CAPABILITY_ICONS: Record = { @@ -390,7 +392,9 @@ const TYPE_ICONS: Record = { [ModelType.Chat]: 'lucide:messages-square', [ModelType.Embedding]: 'lucide:database', [ModelType.Rerank]: 'lucide:arrow-up-wide-narrow', - [ModelType.ImageGeneration]: 'lucide:image' + [ModelType.ImageGeneration]: 'lucide:image', + [ModelType.VideoGeneration]: 'lucide:clapperboard', + [ModelType.TTS]: 'lucide:volume-2' } const props = defineProps<{ @@ -450,7 +454,12 @@ const hasModelCapability = (model: RENDERER_MODEL_META, capability: ModelCapabil } } -const getModelTypeLabel = (type: ModelType) => t(`model.filter.typeOptions.${type}`) +const getModelTypeLabel = (type: ModelType) => { + if (type === ModelType.TTS) { + return t('settings.provider.tts.title') + } + return t(`model.filter.typeOptions.${type}`) +} const getCapabilityLabel = (capability: ModelCapabilityKey) => t(`model.filter.capabilityOptions.${capability}`) @@ -704,13 +713,15 @@ type VirtualModelListItem = enableSearch: boolean typeValue: ModelType group: string - contextLength: number - maxTokens: number + contextLength: RENDERER_MODEL_META['contextLength'] + maxTokens: RENDERER_MODEL_META['maxTokens'] isCustom: boolean supportedEndpointTypes: RENDERER_MODEL_META['supportedEndpointTypes'] endpointType: RENDERER_MODEL_META['endpointType'] } +type VirtualModelItem = Extract + const getCachedVirtualItem = ( id: string, factory: () => TItem, @@ -763,7 +774,7 @@ const createProviderActionsItem = (providerId: string) => ) const createModelItem = (model: RENDERER_MODEL_META) => - getCachedVirtualItem( + getCachedVirtualItem( `${model.providerId}-${model.id}`, () => ({ id: `${model.providerId}-${model.id}`, @@ -914,9 +925,7 @@ const getBatchTargetModels = 
(providerId: string) => { return Array.from(dedupedModels.values()) } -const toRendererModel = ( - item: Extract -): RENDERER_MODEL_META => ({ +const toRendererModel = (item: VirtualModelItem): RENDERER_MODEL_META => ({ id: item.modelId, name: item.name, contextLength: item.contextLength, diff --git a/src/renderer/settings/components/RemoteSettings.vue b/src/renderer/settings/components/RemoteSettings.vue index 469900a14..ef2eec863 100644 --- a/src/renderer/settings/components/RemoteSettings.vue +++ b/src/renderer/settings/components/RemoteSettings.vue @@ -2340,16 +2340,27 @@ const syncWeixinIlinkFields = (snapshot: Partial | nu } } -const channelStatus = (channel: RemoteChannel) => - channel === 'telegram' - ? telegramStatus.value - : channel === 'feishu' - ? feishuStatus.value - : channel === 'qqbot' - ? qqbotStatus.value - : channel === 'discord' - ? discordStatus.value - : weixinIlinkStatus.value +function channelStatus(channel: 'telegram'): TelegramRemoteStatus | null +function channelStatus(channel: 'feishu'): FeishuRemoteStatus | null +function channelStatus(channel: 'qqbot'): QQBotRemoteStatus | null +function channelStatus(channel: 'discord'): DiscordRemoteStatus | null +function channelStatus(channel: 'weixin-ilink'): WeixinIlinkRemoteStatus | null +function channelStatus(channel: RemoteChannel): RemoteChannelStatus | null +function channelStatus(channel: RemoteChannel): RemoteChannelStatus | null { + if (channel === 'telegram') { + return telegramStatus.value + } + if (channel === 'feishu') { + return feishuStatus.value + } + if (channel === 'qqbot') { + return qqbotStatus.value + } + if (channel === 'discord') { + return discordStatus.value + } + return weixinIlinkStatus.value +} const getSnapshotPrincipalIds = ( channel: PairableRemoteChannel, @@ -3105,12 +3116,11 @@ const bindingKindClass = (kind: RemoteBindingSummary['kind']) => { } const formatOverviewLine = (channel: RemoteChannel) => { - const status = channelStatus(channel) - if (!status) { - 
return '' - } - if (channel === 'telegram') { + const status = channelStatus(channel) + if (!status) { + return '' + } return t('settings.remote.overview.telegram', { bindingCount: status.bindingCount, pairedCount: status.allowedUserCount @@ -3118,6 +3128,10 @@ const formatOverviewLine = (channel: RemoteChannel) => { } if (channel === 'qqbot') { + const status = channelStatus(channel) + if (!status) { + return '' + } return t('settings.remote.overview.qqbot', { bindingCount: status.bindingCount, pairedCount: status.pairedUserCount @@ -3125,6 +3139,10 @@ const formatOverviewLine = (channel: RemoteChannel) => { } if (channel === 'discord') { + const status = channelStatus(channel) + if (!status) { + return '' + } return t('settings.remote.overview.discord', { bindingCount: status.bindingCount, pairedCount: status.pairedChannelCount @@ -3132,6 +3150,10 @@ const formatOverviewLine = (channel: RemoteChannel) => { } if (channel === 'weixin-ilink') { + const status = channelStatus(channel) + if (!status) { + return '' + } return t('settings.remote.overview.weixinIlink', { bindingCount: status.bindingCount, accountCount: status.accountCount, @@ -3139,6 +3161,11 @@ const formatOverviewLine = (channel: RemoteChannel) => { }) } + const status = channelStatus('feishu') + if (!status) { + return '' + } + return t('settings.remote.overview.feishu', { bindingCount: status.bindingCount, pairedCount: status.pairedUserCount diff --git a/src/renderer/settings/components/VoiceAIProviderConfig.vue b/src/renderer/settings/components/VoiceAIProviderConfig.vue index 8cdb2a3a8..6483142c3 100644 --- a/src/renderer/settings/components/VoiceAIProviderConfig.vue +++ b/src/renderer/settings/components/VoiceAIProviderConfig.vue @@ -6,9 +6,9 @@

@@ -18,11 +18,11 @@

- {{ t('settings.provider.voiceai.audioFormat.helper') }} + {{ t('settings.provider.tts.audioFormat.helper') }}

- {{ t('settings.provider.voiceai.language.helper') }} + {{ t('settings.provider.tts.language.helper') }}

- {{ t('settings.provider.voiceai.model.helper') }} + {{ t('settings.provider.tts.model.helper') }}

- {{ t('settings.provider.voiceai.agentId.helper') }} + {{ t('settings.provider.tts.agentId.helper') }}

@@ -95,7 +95,7 @@
{{ temperature.toFixed(2) }}
@@ -108,14 +108,14 @@ @update:model-value="onTemperatureChange" />

- {{ t('settings.provider.voiceai.temperature.helper') }} + {{ t('settings.provider.tts.temperature.helper') }}

{{ topP.toFixed(2) }}
@@ -128,7 +128,7 @@ @update:model-value="onTopPChange" />

- {{ t('settings.provider.voiceai.topP.helper') }} + {{ t('settings.provider.tts.topP.helper') }}

diff --git a/src/renderer/src/components/ChatConfig.vue b/src/renderer/src/components/ChatConfig.vue index 6b3e151db..044aaf584 100644 --- a/src/renderer/src/components/ChatConfig.vue +++ b/src/renderer/src/components/ChatConfig.vue @@ -40,7 +40,7 @@ const props = defineProps<{ providerId?: string reasoningEffort?: ReasoningEffort verbosity?: Verbosity - modelType?: 'chat' | 'imageGeneration' | 'embedding' | 'rerank' + modelType?: 'chat' | 'imageGeneration' | 'videoGeneration' | 'tts' | 'embedding' | 'rerank' }>() const systemPrompt = defineModel('systemPrompt') @@ -129,7 +129,7 @@ const { sliderFields, inputFields, selectFields } = useChatConfigFields({ watch( () => props.modelType, (newType) => { - if (newType === 'imageGeneration' && systemPrompt.value) { + if ((newType === 'imageGeneration' || newType === 'videoGeneration') && systemPrompt.value) { systemPrompt.value = '' } } @@ -140,6 +140,8 @@ const modelTypeIcon = computed(() => { const icons = { chat: 'lucide:message-circle', imageGeneration: 'lucide:image', + videoGeneration: 'lucide:clapperboard', + tts: 'lucide:volume-2', embedding: 'lucide:layers', rerank: 'lucide:arrow-up-down' } @@ -157,7 +159,13 @@ const modelTypeIcon = computed(() => {
-
+
diff --git a/src/renderer/src/components/chat/AgentProgressFloat.vue b/src/renderer/src/components/chat/AgentProgressFloat.vue new file mode 100644 index 000000000..804f929db --- /dev/null +++ b/src/renderer/src/components/chat/AgentProgressFloat.vue @@ -0,0 +1,329 @@ + + + + + diff --git a/src/renderer/src/components/chat/ChatSearchBar.vue b/src/renderer/src/components/chat/ChatSearchBar.vue index 80f9e4b7b..b04372830 100644 --- a/src/renderer/src/components/chat/ChatSearchBar.vue +++ b/src/renderer/src/components/chat/ChatSearchBar.vue @@ -16,7 +16,7 @@ autocapitalize="off" autocomplete="off" spellcheck="false" - @update:model-value="emit('update:modelValue', $event)" + @update:model-value="handleModelValueUpdate" @keydown="handleKeydown" />
@@ -115,6 +115,10 @@ const selectInput = () => { element?.select() } +const handleModelValueUpdate = (value: string | number) => { + emit('update:modelValue', String(value)) +} + const handleKeydown = (event: KeyboardEvent) => { if (event.key === 'Escape') { event.preventDefault() diff --git a/src/renderer/src/components/chat/ChatStatusBar.vue b/src/renderer/src/components/chat/ChatStatusBar.vue index dc79db218..77817d13a 100644 --- a/src/renderer/src/components/chat/ChatStatusBar.vue +++ b/src/renderer/src/components/chat/ChatStatusBar.vue @@ -103,12 +103,6 @@ :is-dark="themeStore.isDark" /> {{ displayModelText }} -
-
+
@@ -408,7 +402,7 @@

-
+
@@ -547,8 +541,15 @@ @update:model-value="onImageGenerationSettingsUpdate" /> + +
@@ -721,7 +722,7 @@

-
+