diff --git a/package.json b/package.json index b73947a4e..ed8bcc0b0 100644 --- a/package.json +++ b/package.json @@ -9,7 +9,7 @@ "node": ">=24.14.1 <25", "pnpm": ">=10.11.0" }, - "packageManager": "pnpm@10.13.1+sha512.37ebf1a5c7a30d5fabe0c5df44ee8da4c965ca0c5af3dbab28c3a1681b70a256218d05c81c9c0dcf767ef6b8551eb5b960042b9ed4300c59242336377e01cfad", + "packageManager": "pnpm@10.33.4+sha512.1c67b3b359b2d408119ba1ed289f34b8fc3c6873412bec6fd264fbdc82489e510fcbecb9ce9d22dae7f3b76269d8441046014bdca53b9979cd7a561ad631b800", "scripts": { "prebuild": "node scripts/fetch-provider-db.mjs && node scripts/fetch-acp-registry.mjs", "preinstall": "npx only-allow pnpm", @@ -73,139 +73,140 @@ }, "dependencies": { "@agentclientprotocol/sdk": "^0.16.1", - "@ai-sdk/amazon-bedrock": "^4.0.103", - "@ai-sdk/anthropic": "^3.0.76", - "@ai-sdk/azure": "^3.0.64", - "@ai-sdk/google": "^3.0.72", - "@ai-sdk/google-vertex": "^4.0.126", - "@ai-sdk/openai": "^3.0.63", + "@ai-sdk/amazon-bedrock": "^4.0.107", + "@ai-sdk/anthropic": "^3.0.78", + "@ai-sdk/azure": "^3.0.65", + "@ai-sdk/google": "^3.0.75", + "@ai-sdk/google-vertex": "^4.0.131", + "@ai-sdk/openai": "^3.0.64", "@ai-sdk/openai-compatible": "^2.0.47", "@ai-sdk/provider": "^3.0.10", - "@aws-sdk/client-bedrock": "^3.958.0", + "@aws-sdk/client-bedrock": "^3.1049.0", "@duckdb/node-api": "1.3.2-alpha.25", "@e2b/code-interpreter": "^1.5.1", "@electron-toolkit/preload": "^3.0.2", "@electron-toolkit/utils": "^4.0.0", "@jxa/run": "^1.4.0", - "@larksuiteoapi/node-sdk": "^1.60.0", - "@modelcontextprotocol/sdk": "^1.28.0", - "ai": "^6.0.177", - "axios": "^1.13.6", + "@larksuiteoapi/node-sdk": "^1.64.0", + "@modelcontextprotocol/sdk": "^1.29.0", + "ai": "^6.0.185", + "axios": "^1.16.1", "better-sqlite3-multiple-ciphers": "12.9.0", "cheerio": "^1.2.0", "chokidar": "^5.0.0", "compare-versions": "^6.1.1", "cross-spawn": "^7.0.6", "diff": "^8.0.4", - "electron-log": "^5.4.3", + "electron-log": "^5.4.4", "electron-store": "^8.2.0", "electron-updater": "^6.8.3", "electron-window-state": "^5.0.3", "es-mime-types": "^0.1.4", - "fflate": "^0.8.2", + "fflate": "^0.8.3", "font-list": "^2.0.2", "glob": "^13.0.6", "gray-matter": "^4.0.3", "https-proxy-agent": "^7.0.6", - "jsonrepair": "^3.13.3", + "jsonrepair": "^3.14.0", "mammoth": "^1.12.0", - "nanoid": "^5.1.7", + "nanoid": "^5.1.11", "node-pty": "^1.1.0", "ollama": "^0.6.3", "pdf-parse-new": "^1.4.1", "run-applescript": "^7.1.0", - "safe-regex2": "^5.1.0", + "safe-regex2": "^5.1.1", "sharp": "^0.33.5", "tokenx": "^0.4.1", - "turndown": "^7.2.2", - "undici": "^7.16.0", + "turndown": "^7.2.4", + "undici": "^7.25.0", "xlsx": "https://cdn.sheetjs.com/xlsx-0.20.3/xlsx-0.20.3.tgz", "xml2js": "^0.6.2", "zod": "^3.25.76" }, "devDependencies": { - "@antv/infographic": "^0.2.7", + "@antv/infographic": "^0.2.19", "@electron-toolkit/tsconfig": "^1.0.1", "@electron/notarize": "^3.1.1", - "@iconify-json/lucide": "^1.2.99", - "@iconify-json/vscode-icons": "^1.2.45", - "@iconify/vue": "^5.0.0", + "@iconify-json/lucide": "^1.2.108", + "@iconify-json/vscode-icons": "^1.2.49", + "@iconify/vue": "^5.0.1", "@lingual/i18n-check": "0.8.12", "@pinia/colada": "^0.20.0", - "@playwright/test": "^1.59.1", + "@playwright/test": "^1.60.0", "@tailwindcss/typography": "^0.5.19", - "@tailwindcss/vite": "^4.2.2", - "@tiptap/core": "^2.11.7", - "@tiptap/extension-code-block": "^2.11.9", - "@tiptap/extension-document": "^2.11.7", - "@tiptap/extension-hard-break": "^2.11.7", - "@tiptap/extension-history": "^2.12.0", - "@tiptap/extension-mention": "^2.11.7", - "@tiptap/extension-paragraph": "^2.11.7", - "@tiptap/extension-placeholder": "^2.11.7", - "@tiptap/extension-text": "^2.11.7", - "@tiptap/pm": "^2.11.7", - "@tiptap/suggestion": "^2.11.7", - "@tiptap/vue-3": "^2.11.7", + "@tailwindcss/vite": "^4.3.0", + "@tiptap/core": "^2.27.2", + "@tiptap/extension-code-block": "^2.27.2", + "@tiptap/extension-document": "^2.27.2", + "@tiptap/extension-hard-break": "^2.27.2", + "@tiptap/extension-history": "^2.27.2", + "@tiptap/extension-mention": "^2.27.2", + "@tiptap/extension-paragraph": "^2.27.2", + "@tiptap/extension-placeholder": "^2.27.2", + "@tiptap/extension-text": "^2.27.2", + "@tiptap/pm": "^2.27.2", + "@tiptap/suggestion": "^2.27.2", + "@tiptap/vue-3": "^2.27.2", "@types/better-sqlite3": "^7.6.13", "@types/mime-types": "^3.0.1", - "@types/node": "^24.12.2", + "@types/node": "^24.12.4", "@types/xlsx": "^0.0.35", - "@typescript/native-preview": "7.0.0-dev.20260115.1", + "@typescript/native-preview": "7.0.0-dev.20260518.1", "@unovis/ts": "1.6.4", "@unovis/vue": "1.6.4", "@vee-validate/zod": "^4.15.1", - "@vitejs/plugin-vue": "^6.0.5", + "@vitejs/plugin-vue": "^6.0.7", "@vitest/ui": "^3.2.4", - "@vue/test-utils": "^2.4.6", + "@vue/test-utils": "^2.4.10", "@vueuse/core": "^12.8.2", "@xterm/addon-fit": "^0.10.0", "@xterm/xterm": "^5.5.0", - "autoprefixer": "^10.4.23", + "autoprefixer": "^10.5.0", "class-variance-authority": "^0.7.1", "clsx": "^2.1.1", "cross-env": "^10.1.0", - "dayjs": "^1.11.19", - "electron": "^40.9.2", + "dayjs": "^1.11.20", + "electron": "^40.10.0", "electron-builder": "26.9.0", "electron-vite": "5.0.0", "jsdom": "^26.1.0", - "katex": "^0.16.27", + "katex": "^0.16.47", "lint-staged": "^16.4.0", "lucide-vue-next": "^0.544.0", "markstream-vue": "1.0.0-rc.0", - "mermaid": "^11.13.0", - "minimatch": "^10.2.4", + "mermaid": "^11.15.0", + "minimatch": "^10.2.5", "monaco-editor": "^0.55.1", "oxfmt": "^0.42.0", - "oxlint": "^1.57.0", + "oxlint": "^1.65.0", "picocolors": "^1.1.1", "pinia": "^3.0.4", - "reka-ui": "^2.9.2", + "reka-ui": "^2.9.7", "simple-git-hooks": "^2.13.1", "stream-monaco": "^0.0.40", - "tailwind-merge": "^3.5.0", + "tailwind-merge": "^3.6.0", "tailwind-scrollbar-hide": "^4.0.0", - "tailwindcss": "^4.2.2", + "tailwindcss": "^4.3.0", "tailwindcss-animate": "^1.0.7", + "taze": "^19.12.0", "tippy.js": "^6.3.7", "tw-animate-css": "^1.4.0", "typescript": "^5.9.3", "vee-validate": "^4.15.1", - "vite": "^7.3.1", + "vite": "^7.3.3", "vite-plugin-monaco-editor-esm": "^2.0.2", - "vite-plugin-vue-devtools": "^8.1.1", + "vite-plugin-vue-devtools": "^8.1.2", "vite-svg-loader": "^5.1.1", "vitest": "^3.2.4", - "vue": "^3.5.31", - "vue-i18n": "^11.3.0", + "vue": "^3.5.34", + "vue-i18n": "^11.4.4", "vue-router": "4", "vue-sonner": "^2.0.9", - "vue-tsgo": "0.0.1-yggdrasill.11", - "vue-virtual-scroller": "^3.0.0", + "vue-tsgo": "0.2.2", + "vue-virtual-scroller": "^3.0.3", "vuedraggable": "^4.1.0", - "yaml": "^2.8.3", - "zod-to-json-schema": "^3.25.1" + "yaml": "^2.9.0", + "zod-to-json-schema": "^3.25.2" }, "simple-git-hooks": { "pre-commit": "node scripts/pre-commit.mjs", diff --git a/resources/acp-registry/registry.json b/resources/acp-registry/registry.json index 7a4b51aab..759b3e401 100644 --- a/resources/acp-registry/registry.json +++ b/resources/acp-registry/registry.json @@ -61,7 +61,7 @@ { "id": "auggie", "name": "Auggie CLI", - "version": "0.26.0", + "version": "0.27.2", "description": "Augment Code's powerful software agent, backed by industry-leading context engine", "repository": "https://github.com/augmentcode/auggie", "website": "https://www.augmentcode.com/", @@ -72,7 +72,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/auggie.svg", "distribution": { "npx": { - "package": "@augmentcode/auggie@0.26.0", + "package": "@augmentcode/auggie@0.27.2", "args": [ "--acp" ], @@ -103,7 +103,7 @@ { "id": "claude-acp", "name": "Claude Agent", - "version": "0.33.1", + "version": "0.36.1", "description": "ACP wrapper for Anthropic's Claude", "repository": "https://github.com/agentclientprotocol/claude-agent-acp", "authors": [ @@ -114,7 +114,7 @@ "license": "proprietary", "distribution": { "npx": { - "package": "@agentclientprotocol/claude-agent-acp@0.33.1" + "package": "@agentclientprotocol/claude-agent-acp@0.36.1" } }, "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/claude-acp.svg" @@ -122,7 +122,7 @@ { "id": "cline", "name": "Cline", - "version": "2.18.0", + "version": "3.0.7", "description": "Autonomous coding agent CLI - capable of creating/editing files, running commands, using the browser, and more", "repository": "https://github.com/cline/cline", "website": "https://cline.bot/cli", @@ -133,7 +133,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/cline.svg", "distribution": { "npx": { - "package": "cline@2.18.0", + "package": "cline@3.0.7", "args": [ "--acp" ] @@ -143,7 +143,7 @@ { "id": "codebuddy-code", "name": "Codebuddy Code", - "version": "2.96.0", + "version": "2.97.3", "description": "Tencent Cloud's official intelligent coding tool", "website": "https://www.codebuddy.cn/cli/", "authors": [ @@ -152,7 +152,7 @@ "license": "Proprietary", "distribution": { "npx": { - "package": "@tencent-ai/codebuddy-code@2.96.0", + "package": "@tencent-ai/codebuddy-code@2.97.3", "args": [ "--acp" ] @@ -271,7 +271,7 @@ { "id": "corust-agent", "name": "Corust Agent", - "version": "0.5.1", + "version": "0.6.0", "description": "Co-building with a seasoned Rust partner.", "repository": "https://github.com/Corust-ai/corust-agent-release", "website": "https://corust.ai/", @@ -282,19 +282,19 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.5.1/agent-darwin-arm64.tar.gz", + "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.6.0/agent-darwin-arm64.tar.gz", "cmd": "./corust-agent-acp" }, "darwin-x86_64": { - "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.5.1/agent-darwin-x64.tar.gz", + "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.6.0/agent-darwin-x64.tar.gz", "cmd": "./corust-agent-acp" }, "linux-x86_64": { - "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.5.1/agent-linux-x64.tar.gz", + "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.6.0/agent-linux-x64.tar.gz", "cmd": "./corust-agent-acp" }, "windows-x86_64": { - "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.5.1/agent-windows-x64.zip", + "archive": "https://github.com/Corust-ai/corust-agent-release/releases/download/v0.6.0/agent-windows-x64.zip", "cmd": "./corust-agent-acp.exe" } } @@ -453,7 +453,7 @@ { "id": "dirac", "name": "Dirac", - "version": "0.3.41", + "version": "0.3.44", "description": "Reduces API costs by more than 50%, produces better and faster work. Uses Hash anchored parallel edits, AST manipulation and a whole lot of neat optimizations. Fully Open Source.", "repository": "https://github.com/dirac-run/dirac", "website": "https://dirac.run", @@ -464,7 +464,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/dirac.svg", "distribution": { "npx": { - "package": "dirac-cli@0.3.41", + "package": "dirac-cli@0.3.44", "args": [ "--acp" ] @@ -474,7 +474,7 @@ { "id": "factory-droid", "name": "Factory Droid", - "version": "0.122.0", + "version": "0.129.0", "description": "Factory Droid - AI coding agent powered by Factory AI", "website": "https://factory.ai/product/cli", "authors": [ @@ -483,7 +483,7 @@ "license": "proprietary", "distribution": { "npx": { - "package": "droid@0.122.0", + "package": "droid@0.129.0", "args": [ "exec", "--output-format", @@ -500,7 +500,7 @@ { "id": "fast-agent", "name": "fast-agent", - "version": "0.7.2", + "version": "0.7.6", "description": "Code and build agents with comprehensive multi-provider support", "repository": "https://github.com/evalstate/fast-agent", "website": "https://fast-agent.ai", @@ -510,7 +510,7 @@ "license": "Apache 2.0", "distribution": { "uvx": { - "package": "fast-agent-acp==0.7.2", + "package": "fast-agent-acp==0.7.6", "args": [ "-x" ] @@ -521,7 +521,7 @@ { "id": "gemini", "name": "Gemini CLI", - "version": "0.41.2", + "version": "0.42.0", "description": "Google's official CLI for Gemini", "repository": "https://github.com/google-gemini/gemini-cli", "website": "https://geminicli.com", @@ -531,7 +531,7 @@ "license": "Apache-2.0", "distribution": { "npx": { - "package": "@google/gemini-cli@0.41.2", + "package": "@google/gemini-cli@0.42.0", "args": [ "--acp" ] @@ -542,7 +542,7 @@ { "id": "github-copilot-cli", "name": "GitHub Copilot", - "version": "1.0.45", + "version": "1.0.49", "description": "GitHub's AI pair programmer", "repository": "https://github.com/github/copilot-cli", "website": "https://github.com/features/copilot/cli/", @@ -552,7 +552,7 @@ "license": "proprietary", "distribution": { "npx": { - "package": "@github/copilot@1.0.45", + "package": "@github/copilot@1.0.49", "args": [ "--acp" ] @@ -563,7 +563,7 @@ { "id": "glm-acp-agent", "name": "GLM Agent", - "version": "1.1.3", + "version": "1.1.4", "description": "ACP agent powered by Zhipu AI's GLM Coding Plan models (glm-5.1, glm-5-turbo, glm-4.7, glm-4.5-air). Supports streaming, tool calls, mid-session model switching, image input via Z.AI Coding Plan Vision MCP, and session load/fork/resume with on-disk persistence.", "repository": "https://github.com/stefandevo/glm-acp-agent", "authors": [ @@ -573,14 +573,14 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/glm-acp-agent.svg", "distribution": { "npx": { - "package": "glm-acp-agent@1.1.3" + "package": "glm-acp-agent@1.1.4" } } }, { "id": "goose", "name": "goose", - "version": "1.33.1", + "version": "1.34.1", "description": "A local, extensible, open source AI agent that automates engineering tasks", "repository": "https://github.com/block/goose", "website": "https://block.github.io/goose/", @@ -591,35 +591,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-aarch64-apple-darwin.tar.bz2", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-aarch64-apple-darwin.tar.bz2", "cmd": "./goose", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-x86_64-apple-darwin.tar.bz2", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-x86_64-apple-darwin.tar.bz2", "cmd": "./goose", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-aarch64-unknown-linux-gnu.tar.bz2", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-aarch64-unknown-linux-gnu.tar.bz2", "cmd": "./goose", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-x86_64-unknown-linux-gnu.tar.bz2", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-x86_64-unknown-linux-gnu.tar.bz2", "cmd": "./goose", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/block/goose/releases/download/v1.33.1/goose-x86_64-pc-windows-msvc.zip", + "archive": "https://github.com/block/goose/releases/download/v1.34.1/goose-x86_64-pc-windows-msvc.zip", "cmd": "./goose-package\\goose.exe", "args": [ "acp" @@ -632,7 +632,7 @@ { "id": "junie", "name": "Junie", - "version": "1543.24.0", + "version": "1588.20.0", "description": "AI Coding Agent by JetBrains", "repository": "https://github.com/JetBrains/junie", "website": "https://junie.jetbrains.com", @@ -643,35 +643,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-macos-aarch64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-macos-aarch64.zip", "cmd": "./Applications/junie.app/Contents/MacOS/junie", "args": [ "--acp=true" ] }, "darwin-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-macos-amd64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-macos-amd64.zip", "cmd": "./Applications/junie.app/Contents/MacOS/junie", "args": [ "--acp=true" ] }, "linux-aarch64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-linux-aarch64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-linux-aarch64.zip", "cmd": "./junie-app/bin/junie", "args": [ "--acp=true" ] }, "linux-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-linux-amd64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-linux-amd64.zip", "cmd": "./junie-app/bin/junie", "args": [ "--acp=true" ] }, "windows-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1543.24/junie-release-1543.24-windows-amd64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1588.20/junie-release-1588.20-windows-amd64.zip", "cmd": "./junie/junie.exe", "args": [ "--acp=true" @@ -684,7 +684,7 @@ { "id": "kilo", "name": "Kilo", - "version": "7.2.52", + "version": "7.3.0", "description": "The open source coding agent", "repository": "https://github.com/Kilo-Org/kilocode", "website": "https://kilo.ai/", @@ -696,35 +696,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-darwin-arm64.zip", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-darwin-arm64.zip", "cmd": "./kilo", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-darwin-x64.zip", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-darwin-x64.zip", "cmd": "./kilo", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-linux-arm64.tar.gz", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-linux-arm64.tar.gz", "cmd": "./kilo", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-linux-x64.tar.gz", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-linux-x64.tar.gz", "cmd": "./kilo", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.2.52/kilo-windows-x64.zip", + "archive": "https://github.com/Kilo-Org/kilocode/releases/download/v7.3.0/kilo-windows-x64.zip", "cmd": "./kilo.exe", "args": [ "acp" @@ -732,7 +732,7 @@ } }, "npx": { - "package": "@kilocode/cli@7.2.52", + "package": "@kilocode/cli@7.3.0", "args": [ "acp" ] @@ -742,7 +742,7 @@ { "id": "kimi", "name": "Kimi CLI", - "version": "1.42.0", + "version": "1.44.0", "description": "Moonshot AI's coding assistant", "repository": "https://github.com/MoonshotAI/kimi-cli", "website": "https://moonshotai.github.io/kimi-cli/", @@ -753,28 +753,28 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.42.0/kimi-1.42.0-aarch64-apple-darwin.tar.gz", + "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.44.0/kimi-1.44.0-aarch64-apple-darwin.tar.gz", "cmd": "./kimi", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.42.0/kimi-1.42.0-aarch64-unknown-linux-gnu.tar.gz", + "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.44.0/kimi-1.44.0-aarch64-unknown-linux-gnu.tar.gz", "cmd": "./kimi", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.42.0/kimi-1.42.0-x86_64-unknown-linux-gnu.tar.gz", + "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.44.0/kimi-1.44.0-x86_64-unknown-linux-gnu.tar.gz", "cmd": "./kimi", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.42.0/kimi-1.42.0-x86_64-pc-windows-msvc.zip", + "archive": "https://github.com/MoonshotAI/kimi-cli/releases/download/1.44.0/kimi-1.44.0-x86_64-pc-windows-msvc.zip", "cmd": "./kimi.exe", "args": [ "acp" @@ -848,7 +848,7 @@ { "id": "nova", "name": "Nova", - "version": "1.1.8", + "version": "1.1.9", "description": "Nova by Compass AI - a fully-fledged software engineer at your command", "repository": "https://github.com/Compass-Agentic-Platform/nova", "website": "https://www.compassap.ai/portfolio/nova.html", @@ -859,7 +859,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/nova.svg", "distribution": { "npx": { - "package": "@compass-ai/nova@1.1.8", + "package": "@compass-ai/nova@1.1.9", "args": [ "acp" ] @@ -869,7 +869,7 @@ { "id": "opencode", "name": "OpenCode", - "version": "1.14.48", + "version": "1.15.5", "description": "The open source coding agent", "repository": "https://github.com/anomalyco/opencode", "website": "https://opencode.ai", @@ -881,42 +881,42 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-darwin-arm64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-darwin-arm64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-darwin-x64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-darwin-x64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-linux-arm64.tar.gz", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-linux-arm64.tar.gz", "cmd": "./opencode", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-linux-x64.tar.gz", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-linux-x64.tar.gz", "cmd": "./opencode", "args": [ "acp" ] }, "windows-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-windows-arm64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-windows-arm64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.14.48/opencode-windows-x64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.15.5/opencode-windows-x64.zip", "cmd": "./opencode.exe", "args": [ "acp" @@ -928,7 +928,7 @@ { "id": "pi-acp", "name": "pi ACP", - "version": "0.0.26", + "version": "0.0.27", "description": "ACP adapter for pi coding agent", "repository": "https://github.com/svkozak/pi-acp", "authors": [ @@ -937,7 +937,7 @@ "license": "MIT", "distribution": { "npx": { - "package": "pi-acp@0.0.26" + "package": "pi-acp@0.0.27" } }, "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/pi-acp.svg" @@ -1003,7 +1003,7 @@ { "id": "qoder", "name": "Qoder CLI", - "version": "0.2.12", + "version": "0.2.14", "description": "AI coding assistant with agentic capabilities", "website": "https://qoder.com", "authors": [ @@ -1013,7 +1013,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/qoder.svg", "distribution": { "npx": { - "package": "@qoder-ai/qodercli@0.2.12", + "package": "@qoder-ai/qodercli@0.2.14", "args": [ "--acp" ] @@ -1023,7 +1023,7 @@ { "id": "qwen-code", "name": "Qwen Code", - "version": "0.15.10", + "version": "0.15.11", "description": "Alibaba's Qwen coding assistant", "repository": "https://github.com/QwenLM/qwen-code", "website": "https://qwenlm.github.io/qwen-code-docs/en/users/overview", @@ -1033,7 +1033,7 @@ "license": "Apache-2.0", "distribution": { "npx": { - "package": "@qwen-code/qwen-code@0.15.10", + "package": "@qwen-code/qwen-code@0.15.11", "args": [ "--acp", "--experimental-skills" @@ -1089,7 +1089,7 @@ { "id": "stakpak", "name": "Stakpak", - "version": "0.3.80", + "version": "0.3.81", "description": "Open-source DevOps agent in Rust with enterprise-grade security", "repository": "https://github.com/stakpak/agent", "website": "https://stakpak.dev", @@ -1101,35 +1101,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-darwin-aarch64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-darwin-aarch64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-darwin-x86_64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-darwin-x86_64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-linux-aarch64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-linux-aarch64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-linux-x86_64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-linux-x86_64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.80/stakpak-windows-x86_64.zip", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.81/stakpak-windows-x86_64.zip", "cmd": "./stakpak.exe", "args": [ "acp" diff --git a/resources/model-db/providers.json b/resources/model-db/providers.json index 66f45867c..6cccbe57e 100644 --- a/resources/model-db/providers.json +++ b/resources/model-db/providers.json @@ -1,59 +1,52 @@ { "providers": { - "302ai": { - "id": "302ai", - "name": "302.AI", - "display_name": "302.AI", - "api": "https://api.302.ai/v1", - "doc": "https://doc.302.ai", + "helicone": { + "id": "helicone", + "name": "Helicone", + "display_name": "Helicone", + "api": "https://ai-gateway.helicone.ai/v1", + "doc": "https://helicone.ai/models", "models": [ { - "id": "qwen3-235b-a22b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "claude-opus-4-1-20250805", + "name": "Anthropic: Claude Opus 4.1 (20250805)", + "display_name": "Anthropic: Claude Opus 4.1 (20250805)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.29, - "output": 2.86 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-4.1", - "name": "grok-4.1", - "display_name": "grok-4.1", + "id": "claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "display_name": "Anthropic: Claude 3.7 Sonnet", "modalities": { "input": [ "text", @@ -70,59 +63,79 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 2, - "output": 10 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "mistral-small", + "name": "Mistral Small", + "display_name": "Mistral Small", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 128000, "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-26", - "last_updated": "2025-10-26", + "knowledge": "2024-02", + "release_date": "2024-02-26", + "last_updated": "2024-02-26", "cost": { - "input": 0.33, - "output": 1.32 + "input": 75, + "output": 200 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "grok-4-1-fast-reasoning", - "display_name": "grok-4-1-fast-reasoning", + "id": "chatgpt-4o-latest", + "name": "OpenAI ChatGPT-4o", + "display_name": "OpenAI ChatGPT-4o", "modalities": { "input": [ "text", @@ -133,127 +146,95 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "knowledge": "2024-08", + "release_date": "2024-08-14", + "last_updated": "2024-08-14", "cost": { - "input": 0.2, - "output": 0.5 + "input": 5, + "output": 20, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "gemini-2.5-flash-nothink", - "name": "gemini-2.5-flash-nothink", - "display_name": "gemini-2.5-flash-nothink", + "id": "kimi-k2-0905", + "name": "Kimi K2 (09/05)", + "display_name": "Kimi K2 (09/05)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-24", - "last_updated": "2025-06-24", + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.5, + "output": 2, + "cache_read": 0.39999999999999997 }, "type": "chat" }, { - "id": "grok-4.20-multi-agent-beta-0309", - "name": "grok-4.20-multi-agent-beta-0309", - "display_name": "grok-4.20-multi-agent-beta-0309", + "id": "gemma2-9b-it", + "name": "Google Gemma 2", + "display_name": "Google Gemma 2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-06", + "release_date": "2024-06-25", + "last_updated": "2024-06-25", "cost": { - "input": 2, - "output": 6 + "input": 0.01, + "output": 0.03 }, "type": "chat" }, { - "id": "kimi-k2-0905-preview", - "name": "kimi-k2-0905-preview", - "display_name": "kimi-k2-0905-preview", + "id": "llama-3.1-8b-instant", + "name": "Meta Llama 3.1 8B Instant", + "display_name": "Meta Llama 3.1 8B Instant", "modalities": { "input": [ "text" @@ -263,8 +244,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32678 }, "temperature": true, "tool_call": true, @@ -273,158 +254,131 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.632, - "output": 2.53 + "input": 0.049999999999999996, + "output": 0.08 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "claude-haiku-4-5", - "display_name": "claude-haiku-4-5", + "id": "mistral-large-2411", + "name": "Mistral-Large", + "display_name": "Mistral-Large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-16", - "last_updated": "2025-10-16", + "knowledge": "2024-07", + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 1, - "output": 5 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "claude-opus-4-5-20251101", - "display_name": "claude-opus-4-5-20251101", + "id": "gpt-4o", + "name": "OpenAI GPT-4o", + "display_name": "OpenAI GPT-4o", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 5, - "output": 25 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "gemini-2.5-flash-lite-preview-09-2025", - "display_name": "gemini-2.5-flash-lite-preview-09-2025", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "knowledge": "2025-09", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "qwen3-235b-a22b-instruct-2507", - "display_name": "qwen3-235b-a22b-instruct-2507", + "id": "claude-3-haiku-20240307", + "name": "Anthropic: Claude 3 Haiku", + "display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -433,112 +387,100 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2024-03", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", "cost": { - "input": 0.29, - "output": 1.143 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "sonar-reasoning", + "name": "Perplexity Sonar Reasoning", + "display_name": "Perplexity Sonar Reasoning", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.72, - "output": 3.2 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "mistral-large-2512", - "display_name": "mistral-large-2512", + "id": "llama-prompt-guard-2-22m", + "name": "Meta Llama Prompt Guard 2 22M", + "display_name": "Meta Llama Prompt Guard 2 22M", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 262144 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 1.1, - "output": 3.3 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "o3-pro", + "name": "OpenAI o3 Pro", + "display_name": "OpenAI o3 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -547,34 +489,36 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.286, - "output": 1.142 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "claude-3-5-haiku-20241022", - "display_name": "claude-3-5-haiku-20241022", + "id": "claude-haiku-4-5-20251001", + "name": "Anthropic: Claude 4.5 Haiku (20251001)", + "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -589,21 +533,23 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.8, - "output": 4 + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "doubao-seed-1-8-251215", - "name": "doubao-seed-1-8-251215", - "display_name": "doubao-seed-1-8-251215", + "id": "gpt-4.1-mini-2025-04-14", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ "text", @@ -614,28 +560,30 @@ ] }, "limit": { - "context": 224000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.114, - "output": 0.286 + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 }, "type": "chat" }, { - "id": "chatgpt-4o-latest", - "name": "chatgpt-4o-latest", - "display_name": "chatgpt-4o-latest", + "id": "gemini-2.5-pro", + "name": "Google Gemini 2.5 Pro", + "display_name": "Google Gemini 2.5 Pro", "modalities": { "input": [ "text", @@ -646,40 +594,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-08", - "last_updated": "2024-08-08", - "cost": { - "input": 5, - "output": 15 - }, - "type": "chat" - }, - { - "id": "glm-5", - "name": "glm-5", - "display_name": "glm-5", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -690,31 +606,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.6, - "output": 2.6 + "input": 1.25, + "output": 10, + "cache_read": 0.3125, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "deepseek-chat", - "name": "Deepseek-Chat", - "display_name": "Deepseek-Chat", + "id": "gpt-5-chat-latest", + "name": "OpenAI GPT-5 Chat Latest", + "display_name": "OpenAI GPT-5 Chat Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -722,28 +650,29 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-11-29", - "last_updated": "2024-11-29", + "knowledge": "2024-09", + "release_date": "2024-09-30", + "last_updated": "2024-09-30", "cost": { - "input": 0.29, - "output": 0.43 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "deepseek-v3.2-thinking", - "name": "DeepSeek-V3.2-Thinking", - "display_name": "DeepSeek-V3.2-Thinking", + "id": "grok-3-mini", + "name": "xAI Grok 3 Mini", + "display_name": "xAI Grok 3 Mini", "modalities": { "input": [ "text" @@ -753,45 +682,45 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.29, - "output": 0.43 + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "claude-sonnet-4-6", - "display_name": "claude-sonnet-4-6", + "id": "gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1 Codex Mini", + "display_name": "OpenAI: GPT-5.1 Codex Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -801,43 +730,39 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-18", - "last_updated": "2026-03-13", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15 + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "gpt-5-thinking", - "name": "gpt-5-thinking", - "display_name": "gpt-5-thinking", + "id": "grok-4-1-fast-reasoning", + "name": "xAI Grok 4.1 Fast Reasoning", + "display_name": "xAI Grok 4.1 Fast Reasoning", "modalities": { "input": [ "text", @@ -848,8 +773,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -857,21 +782,27 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 1.25, - "output": 10 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "glm-4.7-flashx", - "display_name": "glm-4.7-flashx", + "id": "kimi-k2-0711", + "name": "Kimi K2 (07/11)", + "display_name": "Kimi K2 (07/11)", "modalities": { "input": [ "text" @@ -881,285 +812,203 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-20", - "last_updated": "2026-01-20", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.0715, - "output": 0.429 + "input": 0.5700000000000001, + "output": 2.3 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "gemini-3-flash-preview", - "display_name": "gemini-3-flash-preview", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 163840, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.5, - "output": 3 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen-Plus", - "display_name": "Qwen-Plus", + "id": "grok-4-1-fast-non-reasoning", + "name": "xAI Grok 4.1 Fast Non-Reasoning", + "display_name": "xAI Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0.12, - "output": 1.2 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "grok-4.20-beta-0309-non-reasoning", - "name": "grok-4.20-beta-0309-non-reasoning", - "display_name": "grok-4.20-beta-0309-non-reasoning", + "id": "qwen2.5-coder-7b-fast", + "name": "Qwen2.5 Coder 7B fast", + "display_name": "Qwen2.5 Coder 7B fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-09", + "release_date": "2024-09-15", + "last_updated": "2024-09-15", "cost": { - "input": 2, - "output": 6 + "input": 0.03, + "output": 0.09 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "claude-opus-4-7", - "display_name": "claude-opus-4-7", + "id": "grok-4", + "name": "xAI Grok 4", + "display_name": "xAI Grok 4", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2024-07", + "release_date": "2024-07-09", + "last_updated": "2024-07-09", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "sonar", + "name": "Perplexity Sonar", + "display_name": "Perplexity Sonar", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 127000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.25, - "output": 2 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "gemini-3-pro-preview", - "display_name": "gemini-3-pro-preview", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text", @@ -1170,47 +1019,29 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 16400 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2, - "output": 12 + "input": 20, + "output": 40 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "grok-code-fast-1", + "name": "xAI Grok Code Fast 1", + "display_name": "xAI Grok Code Fast 1", "modalities": { "input": [ "text" @@ -1220,8 +1051,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, @@ -1230,29 +1061,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": false, - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2024-08", + "release_date": "2024-08-25", + "last_updated": "2024-08-25", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.19999999999999998, + "output": 1.5, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "qwen3-max-2025-09-23", - "name": "qwen3-max-2025-09-23", - "display_name": "qwen3-max-2025-09-23", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -1262,8 +1089,8 @@ ] }, "limit": { - "context": 258048, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -1272,54 +1099,20 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", - "cost": { - "input": 0.86, - "output": 3.43 - }, - "type": "chat" - }, - { - "id": "claude-sonnet-4-5-20250929", - "name": "claude-sonnet-4-5-20250929", - "display_name": "claude-sonnet-4-5-20250929", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-12", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 3, - "output": 15 + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen-Flash", - "display_name": "Qwen-Flash", + "id": "gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", "modalities": { "input": [ "text" @@ -1329,53 +1122,10 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", - "cost": { - "input": 0.022, - "output": 0.22 - }, - "type": "chat" - }, - { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -1385,74 +1135,78 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { "input": 1.25, - "output": 10 + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "grok-4-1-fast-non-reasoning", - "display_name": "grok-4-1-fast-non-reasoning", + "id": "gpt-5.1-chat-latest", + "name": "OpenAI GPT-5.1 Chat", + "display_name": "OpenAI GPT-5.1 Chat", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "claude-3-5-haiku-latest", - "name": "claude-3-5-haiku-latest", - "display_name": "claude-3-5-haiku-latest", + "id": "claude-4.5-haiku", + "name": "Anthropic: Claude 4.5 Haiku", + "display_name": "Anthropic: Claude 4.5 Haiku", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -1467,21 +1221,23 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.8, - "output": 4 + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101-thinking", - "name": "claude-opus-4-5-20251101-thinking", - "display_name": "claude-opus-4-5-20251101-thinking", + "id": "gpt-4.1", + "name": "OpenAI GPT-4.1", + "display_name": "OpenAI GPT-4.1", "modalities": { "input": [ "text", @@ -1492,148 +1248,100 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 5, - "output": 25 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "gpt-5.2", - "display_name": "gpt-5.2", + "id": "glm-4.6", + "name": "Zai GLM-4.6", + "display_name": "Zai GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.75, - "output": 14 + "input": 0.44999999999999996, + "output": 1.5 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "gpt-5.4-mini", - "display_name": "gpt-5.4-mini", + "id": "llama-3.3-70b-versatile", + "name": "Meta Llama 3.3 70B Versatile", + "display_name": "Meta Llama 3.3 70B Versatile", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32678 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.75, - "output": 4.5 + "input": 0.59, + "output": 0.7899999999999999 }, "type": "chat" }, { - "id": "gemini-3-pro-image-preview", - "name": "gemini-3-pro-image-preview", - "display_name": "gemini-3-pro-image-preview", + "id": "claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ "text", @@ -1644,47 +1352,32 @@ ] }, "limit": { - "context": 32768, - "output": 64000 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 2, - "output": 120 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "glm-5.1", - "name": "glm-5.1", - "display_name": "glm-5.1", + "id": "gpt-oss-20b", + "name": "OpenAI GPT-OSS 20b", + "display_name": "OpenAI GPT-OSS 20b", "modalities": { "input": [ "text" @@ -1694,7 +1387,7 @@ ] }, "limit": { - "context": 200000, + "context": 131072, "output": 131072 }, "temperature": true, @@ -1705,93 +1398,84 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": false, - "release_date": "2026-04-10", - "last_updated": "2026-04-10", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.86, - "output": 3.5 + "input": 0.049999999999999996, + "output": 0.19999999999999998 }, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen-Max-Latest", - "display_name": "Qwen-Max-Latest", + "id": "claude-4.5-sonnet", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.343, - "output": 1.372 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "gpt-5.4-nano", - "display_name": "gpt-5.4-nano", + "id": "gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], + "default_enabled": true, + "mode": "fixed", + "effort": "high", "verbosity": "medium", "verbosity_options": [ "low", @@ -1801,197 +1485,166 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 1.25 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "gemini-2.5-flash-image", - "display_name": "gemini-2.5-flash-image", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-10-08", - "last_updated": "2025-10-08", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.3, - "output": 30 + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "gpt-4.1-mini", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.286, - "output": 1.142 + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 }, "type": "chat" }, { - "id": "gpt-5.4-mini-2026-03-17", - "name": "gpt-5.4-mini-2026-03-17", - "display_name": "gpt-5.4-mini-2026-03-17", + "id": "qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2025-07", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.75, - "output": 4.5 + "input": 0.22, + "output": 0.95 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": "llama-3.1-8b-instruct-turbo", + "name": "Meta Llama 3.1 8B Instruct Turbo", + "display_name": "Meta Llama 3.1 8B Instruct Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.02, + "output": 0.03 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "gpt-5.2-chat-latest", - "display_name": "gpt-5.2-chat-latest", + "id": "claude-opus-4-1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ "text", @@ -2002,30 +1655,37 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "doubao-seed-1-6-vision-250815", - "name": "doubao-seed-1-6-vision-250815", - "display_name": "doubao-seed-1-6-vision-250815", + "id": "claude-4.5-opus", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ "text", @@ -2036,178 +1696,231 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-11", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.114, - "output": 1.143 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gemini-3.1-flash-image-preview", - "name": "gemini-3.1-flash-image-preview", - "display_name": "gemini-3.1-flash-image-preview", + "id": "sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "display_name": "Perplexity Sonar Deep Research", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 127000, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-02-27", - "last_updated": "2026-02-27", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.5, - "output": 60 + "input": 2, + "output": 8 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "gemini-2.5-flash-lite", + "name": "Google Gemini 2.5 Flash Lite", + "display_name": "Google Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": false, "open_weights": false, - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2025-07", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.6, - "output": 4.8 + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998, + "cache_write": 0.09999999999999999 }, "type": "chat" }, { - "id": "glm-4.5-x", - "name": "glm-4.5-x", - "display_name": "glm-4.5-x", + "id": "gemini-3-pro-preview", + "name": "Google Gemini 3 Pro Preview", + "display_name": "Google Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "knowledge": "2025-11", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.143, - "output": 2.29 + "input": 2, + "output": 12, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "gpt-5.1", + "name": "OpenAI GPT-5.1", + "display_name": "OpenAI GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "gpt-5.1", - "display_name": "gpt-5.1", + "id": "gpt-5-nano", + "name": "OpenAI GPT-5 Nano", + "display_name": "OpenAI GPT-5 Nano", "modalities": { "input": [ "text", @@ -2225,16 +1938,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -2248,54 +1961,56 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 10 + "input": 0.049999999999999996, + "output": 0.39999999999999997, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "kimi-k2-thinking-turbo", - "display_name": "kimi-k2-thinking-turbo", + "id": "gpt-4o-mini", + "name": "OpenAI GPT-4o-mini", + "display_name": "OpenAI GPT-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.265, - "output": 9.119 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "Deepseek-Reasoner", - "display_name": "Deepseek-Reasoner", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -2305,8 +2020,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -2327,58 +2042,62 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { "input": 0.29, - "output": 0.43 + "output": 0.59 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "grok-4-fast-reasoning", - "display_name": "grok-4-fast-reasoning", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 256000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.48, + "output": 2 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805-thinking", - "name": "claude-opus-4-1-20250805-thinking", - "display_name": "claude-opus-4-1-20250805-thinking", + "id": "llama-4-scout", + "name": "Meta Llama 4 Scout 17B 16E", + "display_name": "Meta Llama 4 Scout 17B 16E", "modalities": { "input": [ "text", @@ -2389,36 +2108,29 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-27", - "last_updated": "2025-05-27", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 15, - "output": 75 + "input": 0.08, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "glm-4.5-air", - "display_name": "glm-4.5-air", + "id": "llama-prompt-guard-2-86m", + "name": "Meta Llama Prompt Guard 2 86M", + "display_name": "Meta Llama Prompt Guard 2 86M", "modalities": { "input": [ "text" @@ -2428,30 +2140,29 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.1143, - "output": 0.286 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "gpt-5.4-pro", - "display_name": "gpt-5.4-pro", + "id": "claude-sonnet-4-5-20250929", + "name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", "modalities": { "input": [ "text", @@ -2462,59 +2173,36 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 30, - "output": 180, - "cache_read": 0, - "cache_write": 0, - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "glm-5-turbo", - "display_name": "glm-5-turbo", + "id": "claude-3.5-sonnet-v2", + "name": "Anthropic: Claude 3.5 Sonnet v2", + "display_name": "Anthropic: Claude 3.5 Sonnet v2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -2522,50 +2210,42 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.72, - "output": 3.2 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { "id": "qwen3-30b-a3b", - "name": "Qwen3-30B-A3B", - "display_name": "Qwen3-30B-A3B", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 41000, + "output": 41000 }, "temperature": true, "tool_call": true, @@ -2585,24 +2265,22 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2025-06", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.11, - "output": 1.08 + "input": 0.08, + "output": 0.29 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "claude-opus-4-5", - "display_name": "claude-opus-4-5", + "id": "o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -2610,69 +2288,77 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 5, - "output": 25 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "ernie-4.5-21b-a3b-thinking", + "name": "Baidu Ernie 4.5 21B A3B Thinking", + "display_name": "Baidu Ernie 4.5 21B A3B Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 128000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "attachment": false, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { - "input": 0.29, - "output": 0.86 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "glm-4.6", - "display_name": "glm-4.6", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -2682,8 +2368,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -2697,33 +2383,32 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.286, - "output": 1.142 + "input": 0.03, + "output": 0.13 }, "type": "chat" }, { - "id": "claude-opus-4-6-thinking", - "name": "claude-opus-4-6-thinking", - "display_name": "claude-opus-4-6-thinking", + "id": "claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -2731,267 +2416,181 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-05", - "release_date": "2026-02-06", - "last_updated": "2026-03-13", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 5, - "output": 25 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "gemini-2.5-flash-preview-09-2025", - "display_name": "gemini-2.5-flash-preview-09-2025", + "id": "sonar-reasoning-pro", + "name": "Perplexity Sonar Reasoning Pro", + "display_name": "Perplexity Sonar Reasoning Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.3, - "output": 2.5 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "claude-sonnet-4-6-thinking", - "name": "claude-sonnet-4-6-thinking", - "display_name": "claude-sonnet-4-6-thinking", + "id": "deepseek-tng-r1t2-chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "display_name": "DeepSeek TNG R1T2 Chimera", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 130000, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-18", - "last_updated": "2026-03-13", + "knowledge": "2025-07", + "release_date": "2025-07-02", + "last_updated": "2025-07-02", "cost": { - "input": 3, - "output": 15 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "gpt-4.1-nano", + "name": "OpenAI GPT-4.1 Nano", + "display_name": "OpenAI GPT-4.1 Nano", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, + "attachment": false, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.145, - "output": 0.43 + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "claude-opus-4-1-20250805", - "display_name": "claude-opus-4-1-20250805", + "id": "gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 15, - "output": 75 + "input": 0.049999999999999996, + "output": 0.09999999999999999 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "gpt-5.4", - "display_name": "gpt-5.4", + "id": "o4-mini", + "name": "OpenAI o4 Mini", + "display_name": "OpenAI o4 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -2999,74 +2598,91 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "cache_write": 0, - "context_over_200k": { - "input": 5, - "output": 22.5 - } + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "gpt-5.1-chat-latest", - "display_name": "gpt-5.1-chat-latest", + "id": "gpt-5.1-codex", + "name": "OpenAI: GPT-5.1 Codex", + "display_name": "OpenAI: GPT-5.1 Codex", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { "input": 1.25, - "output": 10 + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "claude-haiku-4-5-20251001", - "display_name": "claude-haiku-4-5-20251001", + "id": "gemini-2.5-flash", + "name": "Google Gemini 2.5 Flash", + "display_name": "Google Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -3074,86 +2690,124 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-16", - "last_updated": "2025-10-16", + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1, - "output": 5 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax-M1", - "display_name": "MiniMax-M1", + "id": "gpt-5-mini", + "name": "OpenAI GPT-5 Mini", + "display_name": "OpenAI GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.132, - "output": 1.254 + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "gpt-5.4-nano-2026-03-17", - "name": "gpt-5.4-nano-2026-03-17", - "display_name": "gpt-5.4-nano-2026-03-17", + "id": "o3-mini", + "name": "OpenAI o3 Mini", + "display_name": "OpenAI o3 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -3161,56 +2815,55 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2023-10", + "release_date": "2023-10-01", + "last_updated": "2023-10-01", "cost": { - "input": 0.2, - "output": 1.25 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "claude-sonnet-4-20250514", - "display_name": "claude-sonnet-4-20250514", + "id": "llama-4-maverick", + "name": "Meta Llama 4 Maverick 17B 128E", + "display_name": "Meta Llama 4 Maverick 17B 128E", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "qwen3-coder-480b-a35b-instruct", - "display_name": "qwen3-coder-480b-a35b-instruct", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -3221,7 +2874,7 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -3230,112 +2883,85 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-07", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.86, - "output": 3.43 + "input": 0.09999999999999999, + "output": 0.3 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "claude-opus-4-6", - "display_name": "claude-opus-4-6", + "id": "llama-3.3-70b-instruct", + "name": "Meta Llama 3.3 70B Instruct", + "display_name": "Meta Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 16400 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-06", - "last_updated": "2026-03-13", + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 5, - "output": 25 + "input": 0.13, + "output": 0.39 }, "type": "chat" }, { - "id": "doubao-seed-code-preview-251028", - "name": "doubao-seed-code-preview-251028", - "display_name": "doubao-seed-code-preview-251028", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 262000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-11", - "last_updated": "2025-11-11", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.17, - "output": 1.14 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "gpt-4.1-nano", - "display_name": "gpt-4.1-nano", + "id": "claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ "text", @@ -3346,29 +2972,31 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.7999999999999999, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "deepseek-v3.2", - "display_name": "deepseek-v3.2", + "id": "gpt-oss-120b", + "name": "OpenAI GPT-OSS 120b", + "display_name": "OpenAI GPT-OSS 120b", "modalities": { "input": [ "text" @@ -3378,13 +3006,14 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -3393,34 +3022,35 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.29, - "output": 0.43 + "input": 0.04, + "output": 0.16 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "gpt-5-pro", - "display_name": "gpt-5-pro", + "id": "qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking", + "display_name": "Qwen3 235B A22B Thinking", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 262144, + "output": 81920 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -3428,72 +3058,65 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-08", - "last_updated": "2025-10-08", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 15, - "output": 120 + "input": 0.3, + "output": 2.9000000000000004 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "gpt-4o", - "display_name": "gpt-4o", + "id": "hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2024-05", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 2.5, - "output": 10 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "claude-sonnet-4-5", - "display_name": "claude-sonnet-4-5", + "id": "o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -3501,9 +3124,9 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -3511,39 +3134,48 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 3, - "output": 15 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "o1-mini", + "name": "OpenAI: o1-mini", + "display_name": "OpenAI: o1-mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 65536 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -3555,13 +3187,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -3569,139 +3194,102 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 10 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "grok-4.20-beta-0309-reasoning", - "name": "grok-4.20-beta-0309-reasoning", - "display_name": "grok-4.20-beta-0309-reasoning", + "id": "grok-3", + "name": "xAI Grok 3", + "display_name": "xAI Grok 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 2, - "output": 6 + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "claude-opus-4-20250514", - "display_name": "claude-opus-4-20250514", + "id": "grok-4-fast-non-reasoning", + "name": "xAI Grok 4 Fast Non-Reasoning", + "display_name": "xAI Grok 4 Fast Non-Reasoning", "modalities": { "input": [ "text", "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 15, - "output": 75 - }, - "type": "chat" - }, - { - "id": "glm-for-coding", - "name": "glm-for-coding", - "display_name": "glm-for-coding", - "modalities": { - "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-09", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.086, - "output": 0.343 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929-thinking", - "name": "claude-sonnet-4-5-20250929-thinking", - "display_name": "claude-sonnet-4-5-20250929-thinking", + "id": "grok-4-fast-reasoning", + "name": "xAI: Grok 4 Fast Reasoning", + "display_name": "xAI: Grok 4 Fast Reasoning", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -3711,25 +3299,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-09", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 3, - "output": 15 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "glm-4.5-airx", - "name": "glm-4.5-airx", - "display_name": "glm-4.5-airx", + "id": "sonar-pro", + "name": "Perplexity Sonar Pro", + "display_name": "Perplexity Sonar Pro", "modalities": { "input": [ "text" @@ -3739,76 +3327,75 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.572, - "output": 1.714 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "gpt-4.1", - "display_name": "gpt-4.1", + "id": "llama-3.1-8b-instruct", + "name": "Meta Llama 3.1 8B Instruct", + "display_name": "Meta Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2, - "output": 8 + "input": 0.02, + "output": 0.049999999999999996 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "gpt-5", + "name": "OpenAI GPT-5", + "display_name": "OpenAI GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -3817,29 +3404,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.575, - "output": 2.3 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "gemini-2.0-flash-lite", - "display_name": "gemini-2.0-flash-lite", + "id": "llama-guard-4", + "name": "Meta Llama Guard 4 12B", + "display_name": "Meta Llama Guard 4 12B", "modalities": { "input": [ "text", @@ -3850,171 +3448,118 @@ ] }, "limit": { - "context": 2000000, - "output": 8192 + "context": 131072, + "output": 1024 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.21, + "output": 0.21 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "gpt-4.1-mini", - "display_name": "gpt-4.1-mini", + "id": "deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.4, - "output": 1.6 - }, - "type": "chat" - }, - { - "id": "grok-4-fast-non-reasoning", - "name": "grok-4-fast-non-reasoning", - "display_name": "grok-4-fast-non-reasoning", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.27, + "output": 1, + "cache_read": 0.21600000000000003 }, "type": "chat" - }, + } + ] + }, + "auriko": { + "id": "auriko", + "name": "Auriko", + "display_name": "Auriko", + "api": "https://api.auriko.ai/v1", + "doc": "https://docs.auriko.ai", + "models": [ { - "id": "doubao-seed-1-6-thinking-250715", - "name": "doubao-seed-1-6-thinking-250715", - "display_name": "doubao-seed-1-6-thinking-250715", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", - "cost": { - "input": 0.121, - "output": 1.21 - }, - "type": "chat" - }, - { - "id": "ministral-14b-2512", - "name": "ministral-14b-2512", - "display_name": "ministral-14b-2512", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.33, - "output": 0.33 + "input": 0.5, + "output": 2.8 }, "type": "chat" - } - ] - }, - "alibaba": { - "id": "alibaba", - "name": "alibaba", - "display_name": "alibaba", - "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "models": [ + }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -4024,19 +3569,14 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -4050,34 +3590,34 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "qwen3.5-122b-a10b", - "name": "Qwen3.5 122B-A10B", - "display_name": "Qwen3.5 122B-A10B", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -4089,28 +3629,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.4, - "output": 3.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -4121,42 +3687,52 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 5 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "qwen3.6-27b", - "name": "Qwen3.6 27B", - "display_name": "Qwen3.6 27B", + "id": "minimax-m2-7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -4164,211 +3740,210 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.3, + "output": 1.2, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen3.5-27b", - "name": "Qwen3.5 27B", - "display_name": "Qwen3.5 27B", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", "image", - "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", - "cost": { - "input": 0.3, - "output": 2.4 - }, - "type": "chat" - }, - { - "id": "qwen-vl-ocr", - "name": "Qwen Vl Ocr", - "display_name": "Qwen Vl Ocr", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 34096, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-28", - "last_updated": "2025-04-13", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.72, - "output": 0.72 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen-omni-turbo-realtime", - "name": "Qwen-Omni Turbo Realtime", - "display_name": "Qwen-Omni Turbo Realtime", + "id": "qwen-3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", "image", - "audio" + "video" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.27, - "output": 1.07, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 0.5, + "output": 3, + "cache_read": 0.1, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "qwen3-8b", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.18, - "output": 0.7, - "reasoning": 2.1 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -4387,75 +3962,93 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.8, - "output": 2.4 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", @@ -4466,117 +4059,172 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.21, - "output": 0.63 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen3-livetranslate-flash-realtime", - "name": "Qwen3-LiveTranslate Flash Realtime", - "display_name": "Qwen3-LiveTranslate Flash Realtime", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", "audio", - "video" + "video", + "pdf" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 10, - "output": 10, - "input_audio": 10, - "output_audio": 38 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "minimax-m2-7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -4586,57 +4234,49 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.6, - "output": 6.4 + "input": 0.6, + "output": 2.4, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -4649,42 +4289,43 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.4, - "output": 1.2, - "reasoning": 4 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" - }, + } + ] + }, + "firepass": { + "id": "firepass", + "name": "Fireworks (Firepass)", + "display_name": "Fireworks (Firepass)", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://docs.fireworks.ai/firepass", + "models": [ { - "id": "qwen3.6-35b-a3b", - "name": "Qwen3.6 35B-A3B", - "display_name": "Qwen3.6 35B-A3B", + "id": "accounts/fireworks/routers/kimi-k2p6-turbo", + "name": "Kimi K2.6 Turbo", + "display_name": "Kimi K2.6 Turbo", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -4703,58 +4344,60 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, "release_date": "2026-04-17", "last_updated": "2026-04-17", "cost": { - "input": 0.248, - "output": 1.485 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" - }, + } + ] + }, + "nano-gpt": { + "id": "nano-gpt", + "name": "NanoGPT", + "display_name": "NanoGPT", + "api": "https://nano-gpt.com/api/v1", + "doc": "https://docs.nano-gpt.com", + "models": [ { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "glm-zero-preview", + "name": "GLM Zero Preview", + "display_name": "GLM Zero Preview", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 8000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.07, - "output": 0.27, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 1.802, + "output": 1.802 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -4764,100 +4407,71 @@ ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 0.05, - "output": 0.4 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "qwen2-5-vl-7b-instruct", - "name": "Qwen2.5-VL 7B Instruct", - "display_name": "Qwen2.5-VL 7B Instruct", + "id": "hunyuan-t1-latest", + "name": "Hunyuan T1", + "display_name": "Hunyuan T1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2025-03-22", + "last_updated": "2025-03-22", "cost": { - "input": 0.35, - "output": 1.05 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "claude-opus-4-thinking:32000", + "name": "Claude 4 Opus Thinking (32K)", + "display_name": "Claude 4 Opus Thinking (32K)", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -4866,31 +4480,23 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.276, - "output": 1.651, - "cache_read": 0.028, - "cache_write": 0.344 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "Llama-3.3-70B-GeneticLemonade-Opus", + "name": "Llama 3.3 70B GeneticLemonade Opus", + "display_name": "Llama 3.3 70B GeneticLemonade Opus", "modalities": { "input": [ "text" @@ -4900,90 +4506,59 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.2, - "output": 6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-omni-flash", - "name": "Qwen3-Omni Flash", - "display_name": "Qwen3-Omni Flash", + "id": "claude-opus-4-1-20250805", + "name": "Claude 4.1 Opus", + "display_name": "Claude 4.1 Opus", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.43, - "output": 1.66, - "input_audio": 3.81, - "output_audio": 15.11 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "qwen2-5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "command-a-reasoning-08-2025", + "name": "Cohere Command A (08/2025)", + "display_name": "Cohere Command A (08/2025)", "modalities": { "input": [ "text" @@ -4993,107 +4568,87 @@ ] }, "limit": { - "context": 131072, + "context": 256000, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2025-08-22", + "last_updated": "2025-08-22", "cost": { - "input": 1.4, - "output": 5.6 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3-VL 235B-A22B", - "display_name": "Qwen3-VL 235B-A22B", + "id": "Llama-3.3-70B-Magnum-v4-SE", + "name": "Llama 3.3 70B Magnum v4 SE", + "display_name": "Llama 3.3 70B Magnum v4 SE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-asr-flash", - "name": "Qwen3-ASR Flash", - "display_name": "Qwen3-ASR Flash", + "id": "Llama-3.3-70B-The-Omega-Directive-Unslop-v2.1", + "name": "Llama 3.3 70B Omega Directive Unslop v2.1", + "display_name": "Llama 3.3 70B Omega Directive Unslop v2.1", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 32768, + "output": 16384 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.035, - "output": 0.035 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "Llama-3.3-70B-StrawberryLemonade-v1.0", + "name": "Llama 3.3 70B StrawberryLemonade v1.0", + "display_name": "Llama 3.3 70B StrawberryLemonade v1.0", "modalities": { "input": [ "text" @@ -5103,56 +4658,37 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.5, - "output": 6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen-mt-plus", - "name": "Qwen Mt Plus", - "display_name": "Qwen Mt Plus", + "id": "hidream", + "name": "Hidream", + "display_name": "Hidream", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 16384, + "context": 8192, "output": 8192 }, "temperature": true, @@ -5160,21 +4696,16 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", - "cost": { - "input": 2.46, - "output": 7.37 - }, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "glm-4.1v-thinking-flashx", + "name": "GLM 4.1V Thinking FlashX", + "display_name": "GLM 4.1V Thinking FlashX", "modalities": { "input": [ "text", @@ -5185,61 +4716,79 @@ ] }, "limit": { - "context": 131072, + "context": 64000, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.8, - "output": 3.2 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "gemini-2.5-flash-preview-04-17:thinking", + "name": "Gemini 2.5 Flash Preview Thinking", + "display_name": "Gemini 2.5 Flash Preview Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048756, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.15, + "output": 3.5 }, "type": "chat" }, { - "id": "qwen2-5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "auto-model-premium", + "name": "Auto model (Premium)", + "display_name": "Auto model (Premium)", "modalities": { "input": [ "text" @@ -5249,29 +4798,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 1000000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.175, - "output": 0.7 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "qwen2-5-14b-instruct", - "name": "Qwen2.5 14B Instruct", - "display_name": "Qwen2.5 14B Instruct", + "id": "jamba-large-1.6", + "name": "Jamba Large 1.6", + "display_name": "Jamba Large 1.6", "modalities": { "input": [ "text" @@ -5281,61 +4828,58 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.35, - "output": 1.4 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "qwen2-5-32b-instruct", - "name": "Qwen2.5 32B Instruct", - "display_name": "Qwen2.5 32B Instruct", + "id": "gemini-exp-1206", + "name": "Gemini 2.0 Pro 1206", + "display_name": "Gemini 2.0 Pro 1206", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 2097152, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.7, - "output": 2.8 + "input": 1.258, + "output": 4.998 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "Gemma-3-27B-CardProjector-v4", + "name": "Gemma 3 27B CardProjector v4", + "display_name": "Gemma 3 27B CardProjector v4", "modalities": { "input": [ "text" @@ -5345,196 +4889,203 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.5, - "output": 2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen-plus-character-ja", - "name": "Qwen Plus Character (Japanese)", - "display_name": "Qwen Plus Character (Japanese)", + "id": "gemini-3-pro-image-preview", + "name": "Gemini 3 Pro Image", + "display_name": "Gemini 3 Pro Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 512 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.5, - "output": 1.4 + "input": 2, + "output": 12 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen3-omni-flash-realtime", - "name": "Qwen3-Omni Flash Realtime", - "display_name": "Qwen3-Omni Flash Realtime", + "id": "claude-3-7-sonnet-thinking:8192", + "name": "Claude 3.7 Sonnet Thinking (8K)", + "display_name": "Claude 3.7 Sonnet Thinking (8K)", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 200000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.52, - "output": 1.99, - "input_audio": 4.57, - "output_audio": 18.13 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b", - "name": "Qwen3-VL 30B-A3B", - "display_name": "Qwen3-VL 30B-A3B", + "id": "doubao-seed-2-0-lite-260215", + "name": "Doubao Seed 2.0 Lite", + "display_name": "Doubao Seed 2.0 Lite", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.2, - "output": 0.8, - "reasoning": 2.4 + "input": 0.1462, + "output": 0.8738 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3 VL Plus", - "display_name": "Qwen3 VL Plus", + "id": "claude-sonnet-4-thinking:32768", + "name": "Claude 4 Sonnet Thinking (32K)", + "display_name": "Claude 4 Sonnet Thinking (32K)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 64000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 1.6, - "reasoning": 4.8 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "doubao-seed-2-0-pro-260215", + "name": "Doubao Seed 2.0 Pro", + "display_name": "Doubao Seed 2.0 Pro", "modalities": { "input": [ "text" @@ -5544,29 +5095,27 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.782, + "output": 3.876 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "Llama-3.3-70B-Progenitor-V3.3", + "name": "Llama 3.3 70B Progenitor V3.3", + "display_name": "Llama 3.3 70B Progenitor V3.3", "modalities": { "input": [ "text" @@ -5576,251 +5125,204 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.45, - "output": 2.25 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "gemini-2.5-pro-exp-03-25", + "name": "Gemini 2.5 Pro Experimental 0325", + "display_name": "Gemini 2.5 Pro Experimental 0325", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-04-28", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.05, - "output": 0.2, - "reasoning": 0.5 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "qwen-mt-turbo", - "name": "Qwen Mt Turbo", - "display_name": "Qwen Mt Turbo", + "id": "ernie-4.5-turbo-vl-32k", + "name": "Ernie 4.5 Turbo VL 32k", + "display_name": "Ernie 4.5 Turbo VL 32k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 32000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.16, - "output": 0.49 + "input": 0.495, + "output": 1.43 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "deepseek-chat", + "name": "DeepSeek V3/Deepseek Chat", + "display_name": "DeepSeek V3/Deepseek Chat", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.13, - "cache_write": 1.625 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "qwen2-5-omni-7b", - "name": "Qwen2.5-Omni 7B", - "display_name": "Qwen2.5-Omni 7B", + "id": "step-3", + "name": "Step-3", + "display_name": "Step-3", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 65536, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.1, - "output": 0.4, - "input_audio": 6.76 + "input": 0.2499, + "output": 0.6494 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "Llama-3.3-70B-RAWMAW", + "name": "Llama 3.3 70B RAWMAW", + "display_name": "Llama 3.3 70B RAWMAW", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.4, - "output": 2.4, - "reasoning": 2.4 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "GLM-4.5-Air-Derestricted-Iceblink-v2-ReExtract", + "name": "GLM 4.5 Air Derestricted Iceblink v2 ReExtract", + "display_name": "GLM 4.5 Air Derestricted Iceblink v2 ReExtract", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -5828,62 +5330,56 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 2.8, - "output": 8.4 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qvq-max", - "name": "QVQ Max", - "display_name": "QVQ Max", + "id": "universal-summarizer", + "name": "Universal Summarizer", + "display_name": "Universal Summarizer", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2023-05-01", + "last_updated": "2024-01-01", "cost": { - "input": 1.2, - "output": 4.8 + "input": 30, + "output": 30 }, "type": "chat" }, { - "id": "qwen3-14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "GLM-4.5-Air-Derestricted-Steam-ReExtract", + "name": "GLM 4.5 Air Derestricted Steam ReExtract", + "display_name": "GLM 4.5 Air Derestricted Steam ReExtract", "modalities": { "input": [ "text" @@ -5894,92 +5390,26 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", - "cost": { - "input": 0.35, - "output": 1.4, - "reasoning": 4.2 - }, - "type": "chat" - }, - { - "id": "qwen3.5-35b-a3b", - "name": "Qwen3.5 35B-A3B", - "display_name": "Qwen3.5 35B-A3B", - "modalities": { - "input": [ - "text", - "image", - "video", - "audio" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.25, - "output": 2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-09-23", - "name": "Qwen3 Coder Plus 2025 09 23", - "display_name": "Qwen3 Coder Plus 2025 09 23", + "id": "Llama-3.3-70B-Shakudo", + "name": "Llama 3.3 70B Shakudo", + "display_name": "Llama 3.3 70B Shakudo", "modalities": { "input": [ "text" @@ -5989,70 +5419,57 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" - }, - { - "id": "qwen3-coder-plus-2025-07-22", - "name": "Qwen3 Coder Plus 2025 07 22", - "display_name": "Qwen3 Coder Plus 2025 07 22", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-vl-ocr-latest", - "name": "Qwen Vl Ocr Latest", - "display_name": "Qwen Vl Ocr Latest", + "id": "Llama-3.3-70B-Predatorial-Extasy", + "name": "Llama 3.3 70B Predatorial Extasy", + "display_name": "Llama 3.3 70B Predatorial Extasy", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 32768, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qvq-max-2025-05-15", - "name": "Qvq Max 2025 05 15", - "display_name": "Qvq Max 2025 05 15", + "id": "gemini-2.5-pro-preview-03-25", + "name": "Gemini 2.5 Pro Preview 0325", + "display_name": "Gemini 2.5 Pro Preview 0325", "modalities": { "input": [ "text", @@ -6063,27 +5480,47 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 16384, - "min": 0, - "max": 16384 + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "cost": { + "input": 2.5, + "output": 10 + }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long", - "display_name": "Qwen Long", + "id": "Llama-3.3-70B-Cu-Mai-R1", + "name": "Llama 3.3 70B Cu Mai R1", + "display_name": "Llama 3.3 70B Cu Mai R1", "modalities": { "input": [ "text" @@ -6093,139 +5530,116 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 32768, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qwen-turbo-latest", - "name": "Qwen Turbo Latest", - "display_name": "Qwen Turbo Latest", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview (09/2025)", + "display_name": "Gemini 2.5 Flash Preview (09/2025)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-turbo-2024-09-19", - "name": "Qwen Turbo 2024 09 19", - "display_name": "Qwen Turbo 2024 09 19", + "id": "ernie-x1.1-preview", + "name": "ERNIE X1.1", + "display_name": "ERNIE X1.1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 64000, "output": 8192 }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "type": "chat" - }, - { - "id": "qwen-flash-2025-07-28", - "name": "Qwen Flash 2025 07 28", - "display_name": "Qwen Flash 2025 07 28", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", + "cost": { + "input": 0.15, + "output": 0.6 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -6235,19 +5649,13 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -6260,19 +5668,20 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 0.4, + "output": 1.7 + }, "type": "chat" }, { - "id": "qwen-plus-2024-09-19", - "name": "Qwen Plus 2024 09 19", - "display_name": "Qwen Plus 2024 09 19", + "id": "glm-z1-airx", + "name": "GLM Z1 AirX", + "display_name": "GLM Z1 AirX", "modalities": { "input": [ "text" @@ -6282,68 +5691,59 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.7, + "output": 0.7 + }, "type": "chat" }, { - "id": "qwen-plus-2025-07-14", - "name": "Qwen Plus 2025 07 14", - "display_name": "Qwen Plus 2025 07 14", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-plus-2025-09-11", - "name": "Qwen Plus 2025 09 11", - "display_name": "Qwen Plus 2025 09 11", + "id": "v0-1.5-md", + "name": "v0 1.5 MD", + "display_name": "v0 1.5 MD", "modalities": { "input": [ "text" @@ -6353,77 +5753,63 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-07-04", + "last_updated": "2025-07-04", + "cost": { + "input": 3, + "output": 15 + }, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "claude-3-5-sonnet-20240620", + "name": "Claude 3.5 Sonnet Old", + "display_name": "Claude 3.5 Sonnet Old", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2024-06-20", + "last_updated": "2024-06-20", + "cost": { + "input": 2.992, + "output": 14.994 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-max-2024-09-19", - "name": "Qwen Max 2024 09 19", - "display_name": "Qwen Max 2024 09 19", + "id": "qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -6431,26 +5817,38 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "cost": { + "input": 0.5, + "output": 6 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-max-2024-04-28", - "name": "Qwen Max 2024 04 28", - "display_name": "Qwen Max 2024 04 28", + "id": "glm-4-plus", + "name": "GLM-4 Plus", + "display_name": "GLM-4 Plus", "modalities": { "input": [ "text" @@ -6460,21 +5858,27 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-08-01", + "last_updated": "2024-08-01", + "cost": { + "input": 7.497, + "output": 7.497 + }, "type": "chat" }, { - "id": "qwen-max-2024-04-03", - "name": "Qwen Max 2024 04 03", - "display_name": "Qwen Max 2024 04 03", + "id": "fastgpt", + "name": "Web Answer", + "display_name": "Web Answer", "modalities": { "input": [ "text" @@ -6484,21 +5888,27 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2023-08-01", + "last_updated": "2024-01-01", + "cost": { + "input": 7.5, + "output": 7.5 + }, "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen Max 2025 01 25", - "display_name": "Qwen Max 2025 01 25", + "id": "Llama-3.3-70B-Anthrobomination", + "name": "Llama 3.3 70B Anthrobomination", + "display_name": "Llama 3.3 70B Anthrobomination", "modalities": { "input": [ "text" @@ -6508,27 +5918,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qwen3-max-2025-09-23", - "name": "Qwen3 Max 20250923", - "display_name": "Qwen3 Max 20250923", + "id": "Llama-3.3-70B-Ignition-v0.1", + "name": "Llama 3.3 70B Ignition v0.1", + "display_name": "Llama 3.3 70B Ignition v0.1", "modalities": { "input": [ "text" @@ -6538,68 +5948,78 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048756, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "cost": { + "input": 2.5, + "output": 10 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "exa-research", + "name": "Exa (Research)", + "display_name": "Exa (Research)", "modalities": { "input": [ "text" @@ -6609,62 +6029,58 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-06-04", + "last_updated": "2025-06-04", + "cost": { + "input": 2.5, + "output": 2.5 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gemini-2.0-pro-exp-02-05", + "name": "Gemini 2.0 Pro 0205", + "display_name": "Gemini 2.0 Pro 0205", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 2097152, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "cost": { + "input": 1.989, + "output": 7.956 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "ernie-4.5-8k-preview", + "name": "Ernie 4.5 8k Preview", + "display_name": "Ernie 4.5 8k Preview", "modalities": { "input": [ "text" @@ -6674,21 +6090,27 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "cost": { + "input": 0.66, + "output": 2.6 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "auto-model-basic", + "name": "Auto model (Basic)", + "display_name": "Auto model (Basic)", "modalities": { "input": [ "text" @@ -6698,38 +6120,27 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 1000000 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "cost": { + "input": 9.996, + "output": 19.992 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "glm-4-long", + "name": "GLM-4 Long", + "display_name": "GLM-4 Long", "modalities": { "input": [ "text" @@ -6739,38 +6150,27 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-08-01", + "last_updated": "2024-08-01", + "cost": { + "input": 0.2006, + "output": 0.2006 + }, "type": "chat" }, { - "id": "qwen3-4b", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "qwq-32b", + "name": "Qwen: QwQ 32B", + "display_name": "Qwen: QwQ 32B", "modalities": { "input": [ "text" @@ -6780,19 +6180,12 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "supported": true }, "extra_capabilities": { "reasoning": { @@ -6806,53 +6199,50 @@ } }, "attachment": false, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.25599999, + "output": 0.30499999 + }, "type": "chat" }, { - "id": "qwen3-1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "doubao-1-5-thinking-pro-250415", + "name": "Doubao 1.5 Thinking Pro", + "display_name": "Doubao 1.5 Thinking Pro", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": false, + "release_date": "2025-04-17", + "last_updated": "2025-04-17", + "cost": { + "input": 0.6, + "output": 2.4 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "Llama-3.3-70B-GeneticLemonade-Unleashed-v3", + "name": "Llama 3.3 70B GeneticLemonade Unleashed v3", + "display_name": "Llama 3.3 70B GeneticLemonade Unleashed v3", "modalities": { "input": [ "text" @@ -6863,132 +6253,108 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "qwen3-vl-plus-2025-09-23", - "name": "Qwen3 VL Plus 2025 09 23", - "display_name": "Qwen3 VL Plus 2025 09 23", + "id": "exa-research-pro", + "name": "Exa (Research Pro)", + "display_name": "Exa (Research Pro)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 16384, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2025-06-04", + "last_updated": "2025-06-04", + "cost": { + "input": 2.5, + "output": 2.5 + }, "type": "chat" }, { - "id": "qwq-plus-latest", - "name": "QwQ Plus Latest", - "display_name": "QwQ Plus Latest", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview", + "display_name": "Gemini 2.5 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": false + "attachment": true, + "open_weights": false, + "release_date": "2025-04-17", + "last_updated": "2025-04-17", + "cost": { + "input": 0.15, + "output": 0.6 }, - "attachment": false, "type": "chat" - } - ] - }, - "scaleway": { - "id": "scaleway", - "name": "Scaleway", - "display_name": "Scaleway", - "api": "https://api.scaleway.ai/v1", - "doc": "https://www.scaleway.com/en/docs/generative-apis/", - "models": [ + }, { - "id": "qwen3-embedding-8b", - "name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "doubao-seed-2-0-code-preview-260215", + "name": "Doubao Seed 2.0 Code Preview", + "display_name": "Doubao Seed 2.0 Code Preview", "modalities": { "input": [ "text" @@ -6998,28 +6364,27 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 256000, + "output": 128000 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-25-11", - "last_updated": "2026-03-17", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.1, - "output": 0 + "input": 0.782, + "output": 3.893 }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "Llama-3.3-70B-Bigger-Body", + "name": "Llama 3.3 70B Bigger Body", + "display_name": "Llama 3.3 70B Bigger Body", "modalities": { "input": [ "text" @@ -7029,28 +6394,27 @@ ] }, "limit": { - "context": 260000, + "context": 32768, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.75, - "output": 2.25 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "Llama-3.3-70B-Fallen-v1", + "name": "Llama 3.3 70B Fallen v1", + "display_name": "Llama 3.3 70B Fallen v1", "modalities": { "input": [ "text" @@ -7060,75 +6424,27 @@ ] }, "limit": { - "context": 100000, + "context": 32768, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2026-03-17", - "cost": { - "input": 0.9, - "output": 0.9 - }, - "type": "chat" - }, - { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", - "modalities": { - "input": [ - "text", - "image", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "devstral-2-123b-instruct-2512", - "name": "Devstral 2 123B Instruct (2512)", - "display_name": "Devstral 2 123B Instruct (2512)", + "id": "Llama-3.3-70B-Electra-R1", + "name": "Llama 3.3 70B Electra R1", + "display_name": "Llama 3.3 70B Electra R1", "modalities": { "input": [ "text" @@ -7138,28 +6454,27 @@ ] }, "limit": { - "context": 256000, + "context": 32768, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-07", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.4, - "output": 2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "azure-o1", + "name": "Azure o1", + "display_name": "Azure o1", "modalities": { "input": [ "text" @@ -7169,39 +6484,30 @@ ] }, "limit": { - "context": 32000, - "output": 8196 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2024-12-17", + "last_updated": "2024-12-17", "cost": { - "input": 0.9, - "output": 0.9 + "input": 14.994, + "output": 59.993 }, "type": "chat" }, { - "id": "pixtral-12b-2409", - "name": "Pixtral 12B 2409", - "display_name": "Pixtral 12B 2409", + "id": "deepseek-v3-0324", + "name": "DeepSeek Chat 0324", + "display_name": "DeepSeek Chat 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7209,125 +6515,122 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": false, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "chroma", + "name": "Chroma", + "display_name": "Chroma", "modalities": { "input": [ - "audio" + "text" ], "output": [ - "text" + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2026-03-17", - "cost": { - "input": 0.003, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "type": "chat" }, { - "id": "voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "claude-sonnet-4-5-20250929-thinking", + "name": "Claude Sonnet 4.5 Thinking", + "display_name": "Claude Sonnet 4.5 Thinking", "modalities": { "input": [ "text", - "audio" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 1000000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.15, - "output": 0.35 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "gemma-3-27b-it", - "name": "Gemma-3-27B-IT", - "display_name": "Gemma-3-27B-IT", + "id": "jamba-large", + "name": "Jamba Large", + "display_name": "Jamba Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 8192 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2026-03-17", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.25, - "output": 0.5 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "bge-multilingual-gemma2", - "name": "BGE Multilingual Gemma2", - "display_name": "BGE Multilingual Gemma2", + "id": "Llama-3.3-70B-Nova", + "name": "Llama 3.3 70B Nova", + "display_name": "Llama 3.3 70B Nova", "modalities": { "input": [ "text" @@ -7337,92 +6640,84 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 32768, + "output": 16384 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-07-26", - "last_updated": "2025-06-15", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1, - "output": 0 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "z-image-turbo", + "name": "Z Image Turbo", + "display_name": "Z Image Turbo", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2026-03-17", - "cost": { - "input": 0.2, - "output": 0.8 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-27", + "last_updated": "2025-11-27", "type": "chat" }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral Small 3.2 24B Instruct (2506)", - "display_name": "Mistral Small 3.2 24B Instruct (2506)", + "id": "jamba-mini-1.7", + "name": "Jamba Mini 1.7", + "display_name": "Jamba Mini 1.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-20", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.15, - "output": 0.35 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "Llama-3.3-70B-Strawberrylemonade-v1.2", + "name": "Llama 3.3 70B StrawberryLemonade v1.2", + "display_name": "Llama 3.3 70B StrawberryLemonade v1.2", "modalities": { "input": [ "text" @@ -7432,33 +6727,27 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-01-01", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "doubao-seed-2-0-mini-260215", + "name": "Doubao Seed 2.0 Mini", + "display_name": "Doubao Seed 2.0 Mini", "modalities": { "input": [ "text" @@ -7468,28 +6757,27 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-07-25", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.0493, + "output": 0.4845 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "sonar", + "name": "Perplexity Simple", + "display_name": "Perplexity Simple", "modalities": { "input": [ "text" @@ -7499,38 +6787,27 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 127000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.003, + "output": 1.003 }, "type": "chat" - } - ] - }, - "nano-gpt": { - "id": "nano-gpt", - "name": "NanoGPT", - "display_name": "NanoGPT", - "api": "https://nano-gpt.com/api/v1", - "doc": "https://docs.nano-gpt.com", - "models": [ + }, { - "id": "glm-4-flash", - "name": "GLM-4 Flash", - "display_name": "GLM-4 Flash", + "id": "jamba-large-1.7", + "name": "Jamba Large 1.7", + "display_name": "Jamba Large 1.7", "modalities": { "input": [ "text" @@ -7540,7 +6817,7 @@ ] }, "limit": { - "context": 128000, + "context": 256000, "output": 4096 }, "tool_call": false, @@ -7549,18 +6826,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.1003, - "output": 0.1003 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "Meta-Llama-3-1-8B-Instruct-FP8", - "name": "Llama 3.1 8B (decentralized)", - "display_name": "Llama 3.1 8B (decentralized)", + "id": "glm-4-flash", + "name": "GLM-4 Flash", + "display_name": "GLM-4 Flash", "modalities": { "input": [ "text" @@ -7571,7 +6848,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "tool_call": false, "reasoning": { @@ -7579,18 +6856,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.02, - "output": 0.03 + "input": 0.1003, + "output": 0.1003 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:32000", - "name": "Claude 4 Opus Thinking (32K)", - "display_name": "Claude 4 Opus Thinking (32K)", + "id": "claude-opus-4-1-thinking:8192", + "name": "Claude 4.1 Opus Thinking (8K)", + "display_name": "Claude 4.1 Opus Thinking (8K)", "modalities": { "input": [ "text", @@ -7627,60 +6904,39 @@ "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 0506", - "display_name": "Gemini 2.5 Pro Preview 0506", + "id": "step-2-16k-exp", + "name": "Step-2 16k Exp", + "display_name": "Step-2 16k Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 16000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "release_date": "2024-07-05", + "last_updated": "2024-07-05", "cost": { - "input": 2.5, - "output": 10 + "input": 7.004, + "output": 19.992 }, "type": "chat" }, { - "id": "grok-3-mini-fast-beta", - "name": "Grok 3 Mini Fast Beta", - "display_name": "Grok 3 Mini Fast Beta", + "id": "Llama-3.3-70B-Damascus-R1", + "name": "Damascus R1", + "display_name": "Damascus R1", "modalities": { "input": [ "text" @@ -7690,8 +6946,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7699,21 +6955,23 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.6, - "output": 4 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "MiniMax-M2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "claude-opus-4-1-thinking:32000", + "name": "Claude 4.1 Opus Thinking (32K)", + "display_name": "Claude 4.1 Opus Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -7721,7 +6979,45 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 14.994, + "output": 75.004 + }, + "type": "chat" + }, + { + "id": "ernie-5.0-thinking-preview", + "name": "Ernie 5.0 Thinking Preview", + "display_name": "Ernie 5.0 Thinking Preview", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7733,20 +7029,20 @@ "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-25", - "last_updated": "2025-10-25", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.17, - "output": 1.53 + "input": 1.1, + "output": 2 }, "type": "chat" }, { - "id": "command-a-reasoning-08-2025", - "name": "Cohere Command A (08/2025)", - "display_name": "Cohere Command A (08/2025)", + "id": "Llama-3.3-70B-Mokume-Gane-R1", + "name": "Llama 3.3 70B Mokume Gane R1", + "display_name": "Llama 3.3 70B Mokume Gane R1", "modalities": { "input": [ "text" @@ -7756,8 +7052,8 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7765,18 +7061,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-22", - "last_updated": "2025-08-22", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2.5, - "output": 10 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "brave", - "name": "Brave (Answers)", - "display_name": "Brave (Answers)", + "id": "grok-3-beta", + "name": "Grok 3 Beta", + "display_name": "Grok 3 Beta", "modalities": { "input": [ "text" @@ -7786,8 +7082,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -7795,18 +7091,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 5, - "output": 5 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "exa-research", - "name": "Exa (Research)", - "display_name": "Exa (Research)", + "id": "GLM-4.5-Air-Derestricted-Iceblink", + "name": "GLM 4.5 Air Derestricted Iceblink", + "display_name": "GLM 4.5 Air Derestricted Iceblink", "modalities": { "input": [ "text" @@ -7816,8 +7112,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 98304 }, "tool_call": false, "reasoning": { @@ -7825,18 +7121,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2.5, - "output": 2.5 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Nova", - "name": "Llama 3.3 70B Nova", - "display_name": "Llama 3.3 70B Nova", + "id": "glm-4", + "name": "GLM-4", + "display_name": "GLM-4", "modalities": { "input": [ "text" @@ -7846,8 +7142,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -7855,30 +7151,31 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-01-16", + "last_updated": "2024-01-16", "cost": { - "input": 0.306, - "output": 0.306 + "input": 14.994, + "output": 14.994 }, "type": "chat" }, { - "id": "gemini-exp-1206", - "name": "Gemini 2.0 Pro 1206", - "display_name": "Gemini 2.0 Pro 1206", + "id": "ernie-x1-turbo-32k", + "name": "Ernie X1 Turbo 32k", + "display_name": "Ernie X1 Turbo 32k", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2097152, - "output": 8192 + "context": 32000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7886,18 +7183,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 1.258, - "output": 4.998 + "input": 0.165, + "output": 0.66 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude 4.5 Opus", - "display_name": "Claude 4.5 Opus", + "id": "claude-opus-4-1-thinking:32768", + "name": "Claude 4.1 Opus Thinking (32K)", + "display_name": "Claude 4.1 Opus Thinking (32K)", "modalities": { "input": [ "text", @@ -7917,20 +7214,26 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 4.998, - "output": 25.007 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "auto-model-basic", - "name": "Auto model (Basic)", - "display_name": "Auto model (Basic)", + "id": "GLM-4.5-Air-Derestricted-Iceblink-v2", + "name": "GLM 4.5 Air Derestricted Iceblink v2", + "display_name": "GLM 4.5 Air Derestricted Iceblink v2", "modalities": { "input": [ "text" @@ -7940,8 +7243,8 @@ ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 158600, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -7949,18 +7252,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "jamba-mini", - "name": "Jamba Mini", - "display_name": "Jamba Mini", + "id": "Llama-3.3-70B-Legion-V2.1", + "name": "Llama 3.3 70B Legion V2.1", + "display_name": "Llama 3.3 70B Legion V2.1", "modalities": { "input": [ "text" @@ -7970,8 +7273,8 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -7979,70 +7282,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1989, - "output": 0.408 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview (09/2025)", - "display_name": "Gemini 2.5 Flash Lite Preview (09/2025)", + "id": "deepseek-math-v2", + "name": "DeepSeek Math V2", + "display_name": "DeepSeek Math V2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, + "context": 128000, "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "yi-large", - "name": "Yi Large", - "display_name": "Yi Large", + "id": "step-r1-v-mini", + "name": "Step R1 V Mini", + "display_name": "Step R1 V Mini", "modalities": { "input": [ "text" @@ -8052,8 +7333,8 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -8061,79 +7342,87 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-04-08", + "last_updated": "2025-04-08", "cost": { - "input": 3.196, - "output": 3.196 + "input": 2.5, + "output": 11 }, "type": "chat" }, { - "id": "auto-model-premium", - "name": "Auto model (Premium)", - "display_name": "Auto model (Premium)", + "id": "claude-opus-4-5-20251101:thinking", + "name": "Claude 4.5 Opus Thinking", + "display_name": "Claude 4.5 Opus Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 9.996, - "output": 19.992 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "azure-gpt-4o", - "name": "Azure gpt-4o", - "display_name": "Azure gpt-4o", + "id": "grok-3-mini-beta", + "name": "Grok 3 Mini Beta", + "display_name": "Grok 3 Mini Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0.3, + "output": 0.5 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek Chat 0324", - "display_name": "DeepSeek Chat 0324", + "id": "brave-research", + "name": "Brave (Research)", + "display_name": "Brave (Research)", "modalities": { "input": [ "text" @@ -8143,27 +7432,27 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", "cost": { - "input": 0.25, - "output": 0.7 + "input": 5, + "output": 5 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "claude-3-7-sonnet-thinking:1024", + "name": "Claude 3.7 Sonnet Thinking (1K)", + "display_name": "Claude 3.7 Sonnet Thinking (1K)", "modalities": { "input": [ "text", @@ -8176,26 +7465,47 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.8, - "output": 4 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "doubao-seed-1-8-251215", - "name": "Doubao Seed 1.8", - "display_name": "Doubao Seed 1.8", + "id": "venice-uncensored", + "name": "Venice Uncensored", + "display_name": "Venice Uncensored", "modalities": { "input": [ "text" @@ -8206,7 +7516,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -8214,18 +7524,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.612, - "output": 6.12 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "doubao-seed-1-6-250615", - "name": "Doubao Seed 1.6", - "display_name": "Doubao Seed 1.6", + "id": "doubao-1.5-pro-256k", + "name": "Doubao 1.5 Pro 256k", + "display_name": "Doubao 1.5 Pro 256k", "modalities": { "input": [ "text" @@ -8244,44 +7554,60 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.204, - "output": 0.51 + "input": 0.799, + "output": 1.445 }, "type": "chat" }, { - "id": "ernie-x1.1-preview", - "name": "ERNIE X1.1", - "display_name": "ERNIE X1.1", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash 0520", + "display_name": "Gemini 2.5 Flash 0520", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 1048000, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { "input": 0.15, "output": 0.6 @@ -8289,13 +7615,12 @@ "type": "chat" }, { - "id": "ernie-5.0-thinking-preview", - "name": "Ernie 5.0 Thinking Preview", - "display_name": "Ernie 5.0 Thinking Preview", + "id": "KAT-Coder-Exp-72B-1010", + "name": "KAT Coder Exp 72B 1010", + "display_name": "KAT Coder Exp 72B 1010", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -8303,283 +7628,311 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 1.1, - "output": 2 + "input": 0.1, + "output": 0.2 }, "type": "chat" }, { - "id": "glm-4-air-0111", - "name": "GLM 4 Air 0111", - "display_name": "GLM 4 Air 0111", + "id": "claude-opus-4-thinking:32768", + "name": "Claude 4 Opus Thinking (32K)", + "display_name": "Claude 4 Opus Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-11", - "last_updated": "2025-01-11", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.1394, - "output": 0.1394 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "fastgpt", - "name": "Web Answer", - "display_name": "Web Answer", + "id": "claude-sonnet-4-thinking:1024", + "name": "Claude 4 Sonnet Thinking (1K)", + "display_name": "Claude 4 Sonnet Thinking (1K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2023-08-01", - "last_updated": "2024-01-01", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 7.5, - "output": 7.5 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "doubao-seed-1-6-thinking-250615", - "name": "Doubao Seed 1.6 Thinking", - "display_name": "Doubao Seed 1.6 Thinking", + "id": "qwen25-vl-72b-instruct", + "name": "Qwen25 VL 72b", + "display_name": "Qwen25 VL 72b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 32000, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2025-05-10", + "last_updated": "2025-05-10", "cost": { - "input": 0.204, - "output": 2.04 + "input": 0.69989, + "output": 0.69989 }, "type": "chat" }, { - "id": "gemini-2.0-flash-001", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "brave", + "name": "Brave (Answers)", + "display_name": "Brave (Answers)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", "cost": { - "input": 0.1003, - "output": 0.408 + "input": 5, + "output": 5 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking:32000", - "name": "Claude 4.1 Opus Thinking (32K)", - "display_name": "Claude 4.1 Opus Thinking (32K)", + "id": "azure-gpt-4-turbo", + "name": "Azure gpt-4-turbo", + "display_name": "Azure gpt-4-turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2023-11-06", + "last_updated": "2024-01-01", "cost": { - "input": 14.994, - "output": 75.004 + "input": 9.996, + "output": 30.005 }, "type": "chat" }, { - "id": "Llama-3.3-70B-RAWMAW", - "name": "Llama 3.3 70B RAWMAW", - "display_name": "Llama 3.3 70B RAWMAW", + "id": "ernie-5.0-thinking-latest", + "name": "Ernie 5.0 Thinking", + "display_name": "Ernie 5.0 Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.1, + "output": 2 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Steam", - "name": "GLM 4.5 Air Derestricted Steam", - "display_name": "GLM 4.5 Air Derestricted Steam", + "id": "claude-3-7-sonnet-thinking:32768", + "name": "Claude 3.7 Sonnet Thinking (32K)", + "display_name": "Claude 3.7 Sonnet Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 220600, - "output": 65536 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude 3.5 Sonnet", - "display_name": "Claude 3.5 Sonnet", + "id": "doubao-seed-code-preview-latest", + "name": "Doubao Seed Code Preview", + "display_name": "Doubao Seed Code Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "yi-medium-200k", - "name": "Yi Medium 200k", - "display_name": "Yi Medium 200k", + "id": "Llama-3.3-70B-Cirrus-x1", + "name": "Llama 3.3 70B Cirrus x1", + "display_name": "Llama 3.3 70B Cirrus x1", "modalities": { "input": [ "text" @@ -8589,8 +7942,8 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -8598,48 +7951,49 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-03-01", - "last_updated": "2024-03-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2.499, - "output": 2.499 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Gemma-3-27B-ArliAI-RPMax-v3", - "name": "Gemma 3 27B RPMax v3", - "display_name": "Gemma 3 27B RPMax v3", + "id": "doubao-1-5-thinking-vision-pro-250428", + "name": "Doubao 1.5 Thinking Vision Pro", + "display_name": "Doubao 1.5 Thinking Vision Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2025-05-15", + "last_updated": "2025-05-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.55, + "output": 1.43 }, "type": "chat" }, { - "id": "phi-4-mini-instruct", - "name": "Phi 4 Mini", - "display_name": "Phi 4 Mini", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ "text" @@ -8649,27 +8003,38 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.04998, + "output": 0.2006 }, "type": "chat" }, { - "id": "ernie-x1-32k", - "name": "Ernie X1 32k", - "display_name": "Ernie X1 32k", + "id": "gemini-2.0-flash-thinking-exp-01-21", + "name": "Gemini 2.0 Flash Thinking 0121", + "display_name": "Gemini 2.0 Flash Thinking 0121", "modalities": { "input": [ "text", @@ -8680,27 +8045,33 @@ ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 1000000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "release_date": "2025-01-21", + "last_updated": "2025-01-21", "cost": { - "input": 0.33, - "output": 1.32 + "input": 0.306, + "output": 1.003 }, "type": "chat" }, { - "id": "deepseek-chat", - "name": "DeepSeek V3/Deepseek Chat", - "display_name": "DeepSeek V3/Deepseek Chat", + "id": "deepclaude", + "name": "DeepClaude", + "display_name": "DeepClaude", "modalities": { "input": [ "text", @@ -8714,69 +8085,69 @@ "context": 128000, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", "cost": { - "input": 0.25, - "output": 0.7 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "glm-z1-air", - "name": "GLM Z1 Air", - "display_name": "GLM Z1 Air", + "id": "deepseek-chat-cheaper", + "name": "DeepSeek V3/Chat Cheaper", + "display_name": "DeepSeek V3/Chat Cheaper", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 128000, + "output": 8192 }, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, "release_date": "2025-04-15", "last_updated": "2025-04-15", "cost": { - "input": 0.07, - "output": 0.07 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking:128000", - "name": "Claude 3.7 Sonnet Thinking (128K)", - "display_name": "Claude 3.7 Sonnet Thinking (128K)", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 0605", + "display_name": "Gemini 2.5 Pro Preview 0605", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048756, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -8787,34 +8158,33 @@ "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 2.992, - "output": 14.994 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "glm-4-air", - "name": "GLM-4 Air", - "display_name": "GLM-4 Air", + "id": "qwen-max", + "name": "Qwen 2.5 Max", + "display_name": "Qwen 2.5 Max", "modalities": { "input": [ "text" @@ -8824,8 +8194,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -8833,18 +8203,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "release_date": "2024-04-03", + "last_updated": "2024-04-03", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 1.5997, + "output": 6.392 }, "type": "chat" }, { - "id": "Llama-3.3-70B-MiraiFanfare", - "name": "Llama 3.3 70b Mirai Fanfare", - "display_name": "Llama 3.3 70b Mirai Fanfare", + "id": "step-2-mini", + "name": "Step-2 Mini", + "display_name": "Step-2 Mini", "modalities": { "input": [ "text" @@ -8854,8 +8224,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -8863,85 +8233,100 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2024-07-05", + "last_updated": "2024-07-05", "cost": { - "input": 0.493, - "output": 0.493 + "input": 0.2006, + "output": 0.408 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp-01-21", - "name": "Gemini 2.0 Flash Thinking 0121", - "display_name": "Gemini 2.0 Flash Thinking 0121", + "id": "Llama-3.3-70B-Electranova-v1.0", + "name": "Llama 3.3 70B Electranova v1.0", + "display_name": "Llama 3.3 70B Electranova v1.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-21", - "last_updated": "2025-01-21", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { "input": 0.306, - "output": 1.003 + "output": 0.306 }, "type": "chat" }, { - "id": "Magistral-Small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "claude-3-7-sonnet-reasoner", + "name": "Claude 3.7 Sonnet Reasoner", + "display_name": "Claude 3.7 Sonnet Reasoner", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-03-29", + "last_updated": "2025-03-29", "cost": { - "input": 0.4, - "output": 1.4 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "doubao-1.5-pro-32k", - "name": "Doubao 1.5 Pro 32k", - "display_name": "Doubao 1.5 Pro 32k", + "id": "QwQ-32B-ArliAI-RpR-v1", + "name": "QwQ 32b Arli V1", + "display_name": "QwQ 32b Arli V1", "modalities": { "input": [ "text" @@ -8951,57 +8336,69 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-01-22", - "last_updated": "2025-01-22", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.1343, - "output": 0.3349 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "venice-uncensored:web", - "name": "Venice Uncensored Web", - "display_name": "Venice Uncensored Web", + "id": "ernie-4.5-turbo-128k", + "name": "Ernie 4.5 Turbo 128k", + "display_name": "Ernie 4.5 Turbo 128k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 80000, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-05-01", - "last_updated": "2024-05-01", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.132, + "output": 0.55 }, "type": "chat" }, { - "id": "glm-4", - "name": "GLM-4", - "display_name": "GLM-4", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -9011,27 +8408,38 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 64000, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-01-16", - "last_updated": "2024-01-16", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 14.994, - "output": 14.994 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen 2.5 Max", - "display_name": "Qwen 2.5 Max", + "id": "glm-4-plus-0111", + "name": "GLM 4 Plus 0111", + "display_name": "GLM 4 Plus 0111", "modalities": { "input": [ "text" @@ -9041,8 +8449,8 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -9050,22 +8458,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2024-04-03", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 1.5997, - "output": 6.392 + "input": 9.996, + "output": 9.996 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct-original", - "name": "Qwen3 VL 235B A22B Instruct Original", - "display_name": "Qwen3 VL 235B A22B Instruct Original", + "id": "Llama-3.3-70B-Forgotten-Abomination-v5.0", + "name": "Llama 3.3 70B Forgotten Abomination v5.0", + "display_name": "Llama 3.3 70B Forgotten Abomination v5.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -9073,26 +8480,26 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.5, - "output": 1.2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "jamba-large-1.6", - "name": "Jamba Large 1.6", - "display_name": "Jamba Large 1.6", + "id": "doubao-seed-1-8-251215", + "name": "Doubao Seed 1.8", + "display_name": "Doubao Seed 1.8", "modalities": { "input": [ "text" @@ -9102,8 +8509,8 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 128000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -9111,29 +8518,30 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "release_date": "2025-12-15", + "last_updated": "2025-12-15", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.612, + "output": 6.12 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 0506", + "display_name": "Gemini 2.5 Pro Preview 0506", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 995904, - "output": 32768 + "context": 1048756, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -9143,59 +8551,66 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", "cost": { - "input": 0.3995, - "output": 1.2002 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "qwen25-vl-72b-instruct", - "name": "Qwen25 VL 72b", - "display_name": "Qwen25 VL 72b", + "id": "auto-model-standard", + "name": "Auto model (Standard)", + "display_name": "Auto model (Standard)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32768 + "context": 1000000, + "output": 1000000 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-10", - "last_updated": "2025-05-10", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.69989, - "output": 0.69989 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking:64000", - "name": "Claude 4 Sonnet Thinking (64K)", - "display_name": "Claude 4 Sonnet Thinking (64K)", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview (09/2025)", + "display_name": "Gemini 2.5 Flash Lite Preview (09/2025)", "modalities": { "input": [ "text", @@ -9207,34 +8622,77 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048756, + "output": 65536 }, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "sonar-deep-research", + "name": "Perplexity Deep Research", + "display_name": "Perplexity Deep Research", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 60000, + "output": 128000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-02-25", + "last_updated": "2025-02-25", + "cost": { + "input": 3.4, + "output": 13.6 + }, + "type": "chat" + }, + { + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", @@ -9248,21 +8706,23 @@ "context": 1048756, "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ @@ -9272,18 +8732,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 2, - "output": 12 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Iceblink-ReExtract", - "name": "GLM 4.5 Air Derestricted Iceblink ReExtract", - "display_name": "GLM 4.5 Air Derestricted Iceblink ReExtract", + "id": "Gemma-3-27B-Glitter", + "name": "Gemma 3 27B Glitter", + "display_name": "Gemma 3 27B Glitter", "modalities": { "input": [ "text" @@ -9293,8 +8753,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -9302,8 +8762,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { "input": 0.306, "output": 0.306 @@ -9311,9 +8771,9 @@ "type": "chat" }, { - "id": "universal-summarizer", - "name": "Universal Summarizer", - "display_name": "Universal Summarizer", + "id": "Llama-3.3-70B-Vulpecula-R1", + "name": "Llama 3.3 70B Vulpecula R1", + "display_name": "Llama 3.3 70B Vulpecula R1", "modalities": { "input": [ "text" @@ -9324,7 +8784,7 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -9332,57 +8792,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-05-01", - "last_updated": "2024-01-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 30, - "output": 30 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking:32768", - "name": "Claude 4 Sonnet Thinking (32K)", - "display_name": "Claude 4 Sonnet Thinking (32K)", + "id": "Gemma-3-27B-it-Abliterated", + "name": "Gemma 3 27B IT Abliterated", + "display_name": "Gemma 3 27B IT Abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 32768, + "output": 96000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.42, + "output": 0.42 }, "type": "chat" }, { - "id": "sarvan-medium", - "name": "Sarvam Medium", - "display_name": "Sarvam Medium", + "id": "Llama-3.3-70B-Dark-Ages-v0.1", + "name": "Llama 3.3 70B Dark Ages v0.1", + "display_name": "Llama 3.3 70B Dark Ages v0.1", "modalities": { "input": [ "text" @@ -9392,7 +8843,7 @@ ] }, "limit": { - "context": 128000, + "context": 32768, "output": 16384 }, "tool_call": false, @@ -9401,31 +8852,30 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.25, - "output": 0.75 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking:8192", - "name": "Claude 3.7 Sonnet Thinking (8K)", - "display_name": "Claude 3.7 Sonnet Thinking (8K)", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048756, + "output": 65536 }, "tool_call": true, "reasoning": { @@ -9436,88 +8886,64 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" ], - "notes": [ - "Anthropic uses thinking budget tokens" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 2.992, - "output": 14.994 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash 0520", - "display_name": "Gemini 2.5 Flash 0520", + "id": "asi1-mini", + "name": "ASI1 Mini", + "display_name": "ASI1 Mini", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048000, - "output": 65536 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Iceblink-v2-ReExtract", - "name": "GLM 4.5 Air Derestricted Iceblink v2 ReExtract", - "display_name": "GLM 4.5 Air Derestricted Iceblink v2 ReExtract", + "id": "glm-4-air", + "name": "GLM-4 Air", + "display_name": "GLM-4 Air", "modalities": { "input": [ "text" @@ -9527,8 +8953,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -9536,229 +8962,170 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "release_date": "2024-06-05", + "last_updated": "2024-06-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Fallen-v1", - "name": "Llama 3.3 70B Fallen v1", - "display_name": "Llama 3.3 70B Fallen v1", + "id": "kimi-thinking-preview", + "name": "Kimi Thinking Preview", + "display_name": "Kimi Thinking Preview", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.306, - "output": 0.306 + "input": 31.46, + "output": 31.46 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "Meta-Llama-3-1-8B-Instruct-FP8", + "name": "Llama 3.1 8B (decentralized)", + "display_name": "Llama 3.1 8B (decentralized)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.5, - "output": 6 + "input": 0.02, + "output": 0.03 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking:32768", - "name": "Claude 3.7 Sonnet Thinking (32K)", - "display_name": "Claude 3.7 Sonnet Thinking (32K)", + "id": "Llama-3.3-70B-MiraiFanfare", + "name": "Llama 3.3 70b Mirai Fanfare", + "display_name": "Llama 3.3 70b Mirai Fanfare", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.493, + "output": 0.493 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking:1024", - "name": "Claude 3.7 Sonnet Thinking (1K)", - "display_name": "Claude 3.7 Sonnet Thinking (1K)", + "id": "jamba-mini", + "name": "Jamba Mini", + "display_name": "Jamba Mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen3-vl-235b-a22b-instruct-original", + "name": "Qwen3 VL 235B A22B Instruct Original", + "display_name": "Qwen3 VL 235B A22B Instruct Original", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.5, + "output": 1.2 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Vulpecula-R1", - "name": "Llama 3.3 70B Vulpecula R1", - "display_name": "Llama 3.3 70B Vulpecula R1", + "id": "GLM-4.5-Air-Derestricted-Steam", + "name": "GLM 4.5 Air Derestricted Steam", + "display_name": "GLM 4.5 Air Derestricted Steam", "modalities": { "input": [ "text" @@ -9768,8 +9135,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 220600, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -9777,8 +9144,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0.306, "output": 0.306 @@ -9786,9 +9153,9 @@ "type": "chat" }, { - "id": "claude-sonnet-4-thinking:8192", - "name": "Claude 4 Sonnet Thinking (8K)", - "display_name": "Claude 4 Sonnet Thinking (8K)", + "id": "claude-3-5-haiku-20241022", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text", @@ -9800,34 +9167,27 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 8192 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude 3.5 Sonnet", + "display_name": "Claude 3.5 Sonnet", "modalities": { "input": [ "text", @@ -9838,47 +9198,27 @@ ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 2.5, - "output": 10 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Ignition-v0.1", - "name": "Llama 3.3 70B Ignition v0.1", - "display_name": "Llama 3.3 70B Ignition v0.1", + "id": "KAT-Coder-Pro-V1", + "name": "KAT Coder Pro V1", + "display_name": "KAT Coder Pro V1", "modalities": { "input": [ "text" @@ -9888,8 +9228,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -9897,18 +9237,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.5, + "output": 6 }, "type": "chat" }, { - "id": "glm-4-plus-0111", - "name": "GLM 4 Plus 0111", - "display_name": "GLM 4 Plus 0111", + "id": "venice-uncensored:web", + "name": "Venice Uncensored Web", + "display_name": "Venice Uncensored Web", "modalities": { "input": [ "text" @@ -9918,8 +9258,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 80000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -9927,41 +9267,44 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2024-05-01", + "last_updated": "2024-05-01", "cost": { - "input": 9.996, - "output": 9.996 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "KAT-Coder-Air-V1", - "name": "KAT Coder Air V1", - "display_name": "KAT Coder Air V1", + "id": "claude-opus-4-5-20251101", + "name": "Claude 4.5 Opus", + "display_name": "Claude 4.5 Opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.1, - "output": 0.2 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, @@ -9996,55 +9339,13 @@ "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.4, - "output": 1.7 - }, - "type": "chat" - }, - { - "id": "doubao-1-5-thinking-pro-250415", - "name": "Doubao 1.5 Thinking Pro", - "display_name": "Doubao 1.5 Thinking Pro", + "id": "doubao-1-5-thinking-pro-vision-250415", + "name": "Doubao 1.5 Thinking Pro Vision", + "display_name": "Doubao 1.5 Thinking Pro Vision", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" @@ -10060,8 +9361,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { "input": 0.6, "output": 2.4 @@ -10069,9 +9370,9 @@ "type": "chat" }, { - "id": "sonar-pro", - "name": "Perplexity Pro", - "display_name": "Perplexity Pro", + "id": "sarvan-medium", + "name": "Sarvam Medium", + "display_name": "Sarvam Medium", "modalities": { "input": [ "text" @@ -10081,8 +9382,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -10090,51 +9391,53 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.25, + "output": 0.75 }, "type": "chat" }, { - "id": "Gemma-3-27B-it-Abliterated", - "name": "Gemma 3 27B IT Abliterated", - "display_name": "Gemma 3 27B IT Abliterated", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 96000 + "context": 1000000, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.42, - "output": 0.42 + "input": 0.0748, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek-chat-cheaper", - "name": "DeepSeek V3/Chat Cheaper", - "display_name": "DeepSeek V3/Chat Cheaper", + "id": "claude-opus-4-20250514", + "name": "Claude 4 Opus", + "display_name": "Claude 4 Opus", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -10142,8 +9445,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 32000 }, "tool_call": true, "reasoning": { @@ -10151,80 +9454,80 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 0.25, - "output": 0.7 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "gemini-2.0-pro-exp-02-05", - "name": "Gemini 2.0 Pro 0205", - "display_name": "Gemini 2.0 Pro 0205", + "id": "learnlm-1.5-pro-experimental", + "name": "Gemini LearnLM Experimental", + "display_name": "Gemini LearnLM Experimental", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2097152, + "context": 32767, "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", "cost": { - "input": 1.989, - "output": 7.956 + "input": 3.502, + "output": 10.506 }, "type": "chat" }, { - "id": "azure-gpt-4o-mini", - "name": "Azure gpt-4o-mini", - "display_name": "Azure gpt-4o-mini", + "id": "qwen-3.6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 991800, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.1496, - "output": 0.595 + "input": 0.45, + "output": 2.7 }, "type": "chat" }, { - "id": "Llama-3.3-70B-MS-Nevoria", - "name": "Llama 3.3 70B MS Nevoria", - "display_name": "Llama 3.3 70B MS Nevoria", + "id": "yi-large", + "name": "Yi Large", + "display_name": "Yi Large", "modalities": { "input": [ "text" @@ -10234,8 +9537,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 32000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -10243,57 +9546,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.306, - "output": 0.306 + "input": 3.196, + "output": 3.196 }, "type": "chat" }, { - "id": "claude-opus-4-thinking", - "name": "Claude 4 Opus Thinking", - "display_name": "Claude 4 Opus Thinking", + "id": "Baichuan-M2", + "name": "Baichuan M2 32B Medical", + "display_name": "Baichuan M2 32B Medical", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 14.994, - "output": 75.004 + "input": 15.73, + "output": 15.73 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Sapphira-0.1", - "name": "Llama 3.3 70B Sapphira 0.1", - "display_name": "Llama 3.3 70B Sapphira 0.1", + "id": "Llama-3.3-70B-ArliAI-RPMax-v2", + "name": "Llama 3.3 70B ArliAI RPMax v2", + "display_name": "Llama 3.3 70B ArliAI RPMax v2", "modalities": { "input": [ "text" @@ -10312,8 +9606,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { "input": 0.306, "output": 0.306 @@ -10321,9 +9615,9 @@ "type": "chat" }, { - "id": "doubao-seed-code-preview-latest", - "name": "Doubao Seed Code Preview", - "display_name": "Doubao Seed Code Preview", + "id": "glm-4-air-0111", + "name": "GLM 4 Air 0111", + "display_name": "GLM 4 Air 0111", "modalities": { "input": [ "text" @@ -10333,83 +9627,52 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-01-11", + "last_updated": "2025-01-11", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.1394, + "output": 0.1394 }, "type": "chat" }, { - "id": "qwen-3.6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", "image", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 991800, - "output": 65536 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", - "cost": { - "input": 0.45, - "output": 2.7 - }, - "type": "chat" - }, - { - "id": "Llama-3.3-70B-ArliAI-RPMax-v1.4", - "name": "Llama 3.3 70B RPMax v1.4", - "display_name": "Llama 3.3 70B RPMax v1.4", - "modalities": { - "input": [ - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, @@ -10445,40 +9708,39 @@ "type": "chat" }, { - "id": "glm-4.1v-thinking-flashx", - "name": "GLM 4.1V Thinking FlashX", - "display_name": "GLM 4.1V Thinking FlashX", + "id": "grok-3-mini-fast-beta", + "name": "Grok 3 Mini Fast Beta", + "display_name": "Grok 3 Mini Fast Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.6, + "output": 4 }, "type": "chat" }, { - "id": "hunyuan-t1-latest", - "name": "Hunyuan T1", - "display_name": "Hunyuan T1", + "id": "deepseek-reasoner-cheaper", + "name": "Deepseek R1 Cheaper", + "display_name": "Deepseek R1 Cheaper", "modalities": { "input": [ "text" @@ -10488,8 +9750,8 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -10497,52 +9759,52 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-22", - "last_updated": "2025-03-22", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.17, - "output": 0.66 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "doubao-1-5-thinking-vision-pro-250428", - "name": "Doubao 1.5 Thinking Vision Pro", - "display_name": "Doubao 1.5 Thinking Vision Pro", + "id": "Llama-3.3-70B-Aurora-Borealis", + "name": "Llama 3.3 70B Aurora Borealis", + "display_name": "Llama 3.3 70B Aurora Borealis", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 32768, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-15", - "last_updated": "2025-05-15", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.55, - "output": 1.43 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "asi1-mini", - "name": "ASI1 Mini", - "display_name": "ASI1 Mini", + "id": "claude-opus-4-thinking", + "name": "Claude 4 Opus Thinking", + "display_name": "Claude 4 Opus Thinking", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -10550,27 +9812,34 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 1, - "output": 1 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "ernie-5.0-thinking-latest", - "name": "Ernie 5.0 Thinking", - "display_name": "Ernie 5.0 Thinking", + "id": "gemini-2.0-flash-001", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", @@ -10581,28 +9850,27 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.1, - "output": 2 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Incandescent-Malevolence", - "name": "Llama 3.3 70B Incandescent Malevolence", - "display_name": "Llama 3.3 70B Incandescent Malevolence", + "id": "Gemma-3-27B-ArliAI-RPMax-v3", + "name": "Gemma 3 27B RPMax v3", + "display_name": "Gemma 3 27B RPMax v3", "modalities": { "input": [ "text" @@ -10621,8 +9889,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { "input": 0.306, "output": 0.306 @@ -10630,69 +9898,89 @@ "type": "chat" }, { - "id": "Llama-3.3-70B-Damascus-R1", - "name": "Damascus R1", - "display_name": "Damascus R1", + "id": "azure-gpt-4o", + "name": "Azure gpt-4o", + "display_name": "Azure gpt-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "Gemma-3-27B-Nidum-Uncensored", - "name": "Gemma 3 27B Nidum Uncensored", - "display_name": "Gemma 3 27B Nidum Uncensored", + "id": "gemini-3-pro-preview-thinking", + "name": "Gemini 3 Pro Thinking", + "display_name": "Gemini 3 Pro Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 96000 + "context": 1048756, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025-thinking", - "name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", - "display_name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", + "id": "claude-3-7-sonnet-thinking", + "name": "Claude 3.7 Sonnet Thinking", + "display_name": "Claude 3.7 Sonnet Thinking", "modalities": { "input": [ "text", @@ -10704,77 +9992,87 @@ ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 16000 }, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, + "min": 1024, "unit": "tokens" }, - "summaries": true, - "visibility": "summary", + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.1, - "output": 0.4 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "doubao-seed-2-0-pro-260215", - "name": "Doubao Seed 2.0 Pro", - "display_name": "Doubao Seed 2.0 Pro", + "id": "claude-opus-4-1-thinking:1024", + "name": "Claude 4.1 Opus Thinking (1K)", + "display_name": "Claude 4.1 Opus Thinking (1K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.782, - "output": 3.876 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "gemini-3-pro-image-preview", - "name": "Gemini 3 Pro Image", - "display_name": "Gemini 3 Pro Image", + "id": "gemini-2.5-flash-preview-05-20:thinking", + "name": "Gemini 2.5 Flash 0520 Thinking", + "display_name": "Gemini 2.5 Flash 0520 Thinking", "modalities": { "input": [ "text", @@ -10785,7 +10083,7 @@ ] }, "limit": { - "context": 1048756, + "context": 1048000, "output": 65536 }, "tool_call": false, @@ -10797,12 +10095,15 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ @@ -10812,78 +10113,88 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 2, - "output": 12 + "input": 0.15, + "output": 3.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "Gemma-3-27B-CardProjector-v4", - "name": "Gemma 3 27B CardProjector v4", - "display_name": "Gemma 3 27B CardProjector v4", + "id": "claude-opus-4-thinking:1024", + "name": "Claude 4 Opus Thinking (1K)", + "display_name": "Claude 4 Opus Thinking (1K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.306, - "output": 0.306 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "jamba-mini-1.7", - "name": "Jamba Mini 1.7", - "display_name": "Jamba Mini 1.7", + "id": "doubao-1.5-vision-pro-32k", + "name": "Doubao 1.5 Vision Pro 32k", + "display_name": "Doubao 1.5 Vision Pro 32k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 32000, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-01-22", + "last_updated": "2025-01-22", "cost": { - "input": 0.1989, - "output": 0.408 + "input": 0.459, + "output": 1.377 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Forgotten-Safeword-3.6", - "name": "Llama 3.3 70B Forgotten Safeword 3.6", - "display_name": "Llama 3.3 70B Forgotten Safeword 3.6", + "id": "Llama-3.3-70B-Fallen-R1-v1", + "name": "Llama 3.3 70B Fallen R1 v1", + "display_name": "Llama 3.3 70B Fallen R1 v1", "modalities": { "input": [ "text" @@ -10911,9 +10222,9 @@ "type": "chat" }, { - "id": "doubao-1-5-thinking-pro-vision-250415", - "name": "Doubao 1.5 Thinking Pro Vision", - "display_name": "Doubao 1.5 Thinking Pro Vision", + "id": "glm-4.1v-thinking-flash", + "name": "GLM 4.1V Thinking Flash", + "display_name": "GLM 4.1V Thinking Flash", "modalities": { "input": [ "text", @@ -10924,8 +10235,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 64000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -10933,69 +10244,48 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.6, - "output": 2.4 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 0605", - "display_name": "Gemini 2.5 Pro Preview 0605", + "id": "gemini-2.0-flash-thinking-exp-1219", + "name": "Gemini 2.0 Flash Thinking 1219", + "display_name": "Gemini 2.0 Flash Thinking 1219", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 32767, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": "2024-12-19", + "last_updated": "2024-12-19", "cost": { - "input": 2.5, - "output": 10 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "gemini-2.0-pro-reasoner", - "name": "Gemini 2.0 Pro Reasoner", - "display_name": "Gemini 2.0 Pro Reasoner", + "id": "Llama-3.3-70B-Magnum-v4-SE-Cirrus-x1-SLERP", + "name": "Llama 3.3 70B Magnum v4 SE Cirrus x1 SLERP", + "display_name": "Llama 3.3 70B Magnum v4 SE Cirrus x1 SLERP", "modalities": { "input": [ "text" @@ -11005,8 +10295,8 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -11014,46 +10304,42 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 1.292, - "output": 4.998 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "doubao-seed-2-0-lite-260215", - "name": "Doubao Seed 2.0 Lite", - "display_name": "Doubao Seed 2.0 Lite", + "id": "grok-3-fast-beta", + "name": "Grok 3 Fast Beta", + "display_name": "Grok 3 Fast Beta", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.1462, - "output": 0.8738 + "input": 5, + "output": 25 }, "type": "chat" }, @@ -11109,39 +10395,40 @@ "type": "chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Deep Research", - "display_name": "Perplexity Deep Research", + "id": "study_gpt-chatgpt-4o-latest", + "name": "Study Mode", + "display_name": "Study Mode", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 60000, - "output": 128000 + "context": 200000, + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-02-25", - "last_updated": "2025-02-25", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 3.4, - "output": 13.6 + "input": 4.998, + "output": 14.994 }, "type": "chat" }, { - "id": "Gemma-3-27B-it", - "name": "Gemma 3 27B IT", - "display_name": "Gemma 3 27B IT", + "id": "Llama-3.3-70B-ArliAI-RPMax-v3", + "name": "Llama 3.3 70B ArliAI RPMax v3", + "display_name": "Llama 3.3 70B ArliAI RPMax v3", "modalities": { "input": [ "text" @@ -11160,8 +10447,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { "input": 0.306, "output": 0.306 @@ -11169,39 +10456,40 @@ "type": "chat" }, { - "id": "Llama-3.3-70B-GeneticLemonade-Unleashed-v3", - "name": "Llama 3.3 70B GeneticLemonade Unleashed v3", - "display_name": "Llama 3.3 70B GeneticLemonade Unleashed v3", + "id": "qwen-long", + "name": "Qwen Long 10M", + "display_name": "Qwen Long 10M", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 10000000, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "Gemma-3-27B-Glitter", - "name": "Gemma 3 27B Glitter", - "display_name": "Gemma 3 27B Glitter", + "id": "Baichuan4-Air", + "name": "Baichuan 4 Air", + "display_name": "Baichuan 4 Air", "modalities": { "input": [ "text" @@ -11212,7 +10500,7 @@ }, "limit": { "context": 32768, - "output": 16384 + "output": 32768 }, "tool_call": false, "reasoning": { @@ -11220,18 +10508,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.157, + "output": 0.157 }, "type": "chat" }, { - "id": "Llama-3.3-70B-The-Omega-Directive-Unslop-v2.1", - "name": "Llama 3.3 70B Omega Directive Unslop v2.1", - "display_name": "Llama 3.3 70B Omega Directive Unslop v2.1", + "id": "gemini-2.0-flash-exp-image-generation", + "name": "Gemini Text + Image", + "display_name": "Gemini Text + Image", "modalities": { "input": [ "text" @@ -11241,8 +10529,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 32767, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -11250,18 +10538,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "v0-1.5-lg", + "name": "v0 1.5 LG", + "display_name": "v0 1.5 LG", "modalities": { "input": [ "text" @@ -11271,8 +10559,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 1000000, + "output": 64000 }, "tool_call": false, "reasoning": { @@ -11280,85 +10568,63 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "release_date": "2025-07-04", + "last_updated": "2025-07-04", "cost": { - "input": 0.2, - "output": 0.5 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025-thinking", - "name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", - "display_name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", + "id": "yi-medium-200k", + "name": "Yi Medium 200k", + "display_name": "Yi Medium 200k", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2024-03-01", + "last_updated": "2024-03-01", "cost": { - "input": 0.3, - "output": 2.5 + "input": 2.499, + "output": 2.499 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "claude-opus-4-1-thinking", + "name": "Claude 4.1 Opus Thinking", + "display_name": "Claude 4.1 Opus Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -11366,37 +10632,23 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default_enabled": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.3, - "output": 2.5 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "deepclaude", - "name": "DeepClaude", - "display_name": "DeepClaude", + "id": "Mistral-Nemo-12B-Instruct-2407", + "name": "Mistral Nemo 12B Instruct 2407", + "display_name": "Mistral Nemo 12B Instruct 2407", "modalities": { "input": [ "text", @@ -11407,8 +10659,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -11416,18 +10668,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 3, - "output": 15 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "ernie-4.5-8k-preview", - "name": "Ernie 4.5 8k Preview", - "display_name": "Ernie 4.5 8k Preview", + "id": "yi-lightning", + "name": "Yi Lightning", + "display_name": "Yi Lightning", "modalities": { "input": [ "text" @@ -11437,8 +10689,8 @@ ] }, "limit": { - "context": 8000, - "output": 16384 + "context": 12000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -11446,18 +10698,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2024-10-16", + "last_updated": "2024-10-16", "cost": { - "input": 0.66, - "output": 2.6 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "doubao-seed-2-0-mini-260215", - "name": "Doubao Seed 2.0 Mini", - "display_name": "Doubao Seed 2.0 Mini", + "id": "sonar-reasoning-pro", + "name": "Perplexity Reasoning Pro", + "display_name": "Perplexity Reasoning Pro", "modalities": { "input": [ "text" @@ -11467,39 +10719,41 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 127000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.0493, - "output": 0.4845 + "input": 2.006, + "output": 7.9985 }, "type": "chat" }, { - "id": "gemini-3-pro-preview-thinking", - "name": "Gemini 3 Pro Thinking", - "display_name": "Gemini 3 Pro Thinking", + "id": "claude-sonnet-4-thinking:8192", + "name": "Claude 4 Sonnet Thinking (8K)", + "display_name": "Claude 4 Sonnet Thinking (8K)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 1000000, + "output": 64000 }, "tool_call": true, "reasoning": { @@ -11509,34 +10763,23 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default_enabled": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 12 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "Llama-3.3-70B-GeneticLemonade-Opus", - "name": "Llama 3.3 70B GeneticLemonade Opus", - "display_name": "Llama 3.3 70B GeneticLemonade Opus", + "id": "azure-o3-mini", + "name": "Azure o3-mini", + "display_name": "Azure o3-mini", "modalities": { "input": [ "text" @@ -11546,8 +10789,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -11555,18 +10798,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.088, + "output": 4.3996 }, "type": "chat" }, { - "id": "v0-1.5-lg", - "name": "v0 1.5 LG", - "display_name": "v0 1.5 LG", + "id": "Llama-3.3-70B-Argunaut-1-SFT", + "name": "Llama 3.3 70B Argunaut 1 SFT", + "display_name": "Llama 3.3 70B Argunaut 1 SFT", "modalities": { "input": [ "text" @@ -11576,8 +10819,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -11585,49 +10828,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 15, - "output": 75 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "ernie-4.5-turbo-128k", - "name": "Ernie 4.5 Turbo 128k", - "display_name": "Ernie 4.5 Turbo 128k", + "id": "Llama-3.3-70B-Mhnnn-x1", + "name": "Llama 3.3 70B Mhnnn x1", + "display_name": "Llama 3.3 70B Mhnnn x1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 32768, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.132, - "output": 0.55 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "KAT-Coder-Pro-V1", - "name": "KAT Coder Pro V1", - "display_name": "KAT Coder Pro V1", + "id": "Llama-3.3-70B-ArliAI-RPMax-v1.4", + "name": "Llama 3.3 70B RPMax v1.4", + "display_name": "Llama 3.3 70B RPMax v1.4", "modalities": { "input": [ "text" @@ -11637,8 +10879,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -11646,89 +10888,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.5, - "output": 6 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20240620", - "name": "Claude 3.5 Sonnet Old", - "display_name": "Claude 3.5 Sonnet Old", + "id": "Gemma-3-27B-it", + "name": "Gemma 3 27B IT", + "display_name": "Gemma 3 27B IT", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 200000, - "output": 8192 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2024-06-20", - "last_updated": "2024-06-20", - "cost": { - "input": 2.992, - "output": 14.994 - }, - "type": "chat" - }, - { - "id": "claude-opus-4-1-thinking:8192", - "name": "Claude 4.1 Opus Thinking (8K)", - "display_name": "Claude 4.1 Opus Thinking (8K)", - "modalities": { - "input": [ - "text", - "image", - "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "gemini-2.0-flash-exp-image-generation", - "name": "Gemini Text + Image", - "display_name": "Gemini Text + Image", + "id": "GLM-4.5-Air-Derestricted", + "name": "GLM 4.5 Air Derestricted", + "display_name": "GLM 4.5 Air Derestricted", "modalities": { "input": [ "text" @@ -11738,8 +10939,8 @@ ] }, "limit": { - "context": 32767, - "output": 8192 + "context": 202600, + "output": 98304 }, "tool_call": false, "reasoning": { @@ -11747,18 +10948,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Magnum-v4-SE", - "name": "Llama 3.3 70B Magnum v4 SE", - "display_name": "Llama 3.3 70B Magnum v4 SE", + "id": "Baichuan4-Turbo", + "name": "Baichuan 4 Turbo", + "display_name": "Baichuan 4 Turbo", "modalities": { "input": [ "text" @@ -11768,8 +10969,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -11777,18 +10978,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.42, + "output": 2.42 }, "type": "chat" }, { - "id": "glm-zero-preview", - "name": "GLM Zero Preview", - "display_name": "GLM Zero Preview", + "id": "jamba-mini-1.6", + "name": "Jamba Mini 1.6", + "display_name": "Jamba Mini 1.6", "modalities": { "input": [ "text" @@ -11798,7 +10999,7 @@ ] }, "limit": { - "context": 8000, + "context": 256000, "output": 4096 }, "tool_call": false, @@ -11807,18 +11008,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 1.802, - "output": 1.802 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "study_gpt-chatgpt-4o-latest", - "name": "Study Mode", - "display_name": "Study Mode", + "id": "qvq-max", + "name": "Qwen: QvQ Max", + "display_name": "Qwen: QvQ Max", "modalities": { "input": [ "text", @@ -11829,8 +11030,8 @@ ] }, "limit": { - "context": 200000, - "output": 16384 + "context": 128000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -11838,18 +11039,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-03-28", + "last_updated": "2025-03-28", "cost": { - "input": 4.998, - "output": 14.994 + "input": 1.4, + "output": 5.3 }, "type": "chat" }, { - "id": "glm-4-airx", - "name": "GLM-4 AirX", - "display_name": "GLM-4 AirX", + "id": "MiniMax-M1", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ "text" @@ -11859,8 +11060,8 @@ ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 1000000, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -11868,18 +11069,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 2.006, - "output": 2.006 + "input": 0.1394, + "output": 1.3328 }, "type": "chat" }, { - "id": "step-2-mini", - "name": "Step-2 Mini", - "display_name": "Step-2 Mini", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -11889,27 +11090,38 @@ ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 245800, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-07-05", - "last_updated": "2024-07-05", + "release_date": "2026-04-20", + "last_updated": "2026-04-21", "cost": { - "input": 0.2006, - "output": 0.408 + "input": 1.3, + "output": 7.8 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17:thinking", - "name": "Gemini 2.5 Flash Preview Thinking", - "display_name": "Gemini 2.5 Flash Preview Thinking", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", @@ -11950,48 +11162,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", - "cost": { - "input": 0.15, - "output": 3.5 - }, - "type": "chat" - }, - { - "id": "Llama-3.3-70B-Mokume-Gane-R1", - "name": "Llama 3.3 70B Mokume Gane R1", - "display_name": "Llama 3.3 70B Mokume Gane R1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 16384 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max 2026-01-23", + "display_name": "Qwen3 Max 2026-01-23", "modalities": { "input": [ "text" @@ -12001,8 +11183,8 @@ ] }, "limit": { - "context": 64000, - "output": 65536 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -12021,18 +11203,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - "input": 0.4, - "output": 1.7 + "input": 1.2002, + "output": 6.001 }, "type": "chat" }, { - "id": "glm-z1-airx", - "name": "GLM Z1 AirX", - "display_name": "GLM Z1 AirX", + "id": "Gemma-3-27B-Nidum-Uncensored", + "name": "Gemma 3 27B Nidum Uncensored", + "display_name": "Gemma 3 27B Nidum Uncensored", "modalities": { "input": [ "text" @@ -12042,27 +11224,27 @@ ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 32768, + "output": 96000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "jamba-mini-1.6", - "name": "Jamba Mini 1.6", - "display_name": "Jamba Mini 1.6", + "id": "GLM-4.6-Derestricted-v5", + "name": "GLM 4.6 Derestricted v5", + "display_name": "GLM 4.6 Derestricted v5", "modalities": { "input": [ "text" @@ -12072,8 +11254,8 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -12081,57 +11263,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.1989, - "output": 0.408 + "input": 0.4, + "output": 1.5 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking", - "name": "Claude 4.1 Opus Thinking", - "display_name": "Claude 4.1 Opus Thinking", + "id": "glm-4-airx", + "name": "GLM-4 AirX", + "display_name": "GLM-4 AirX", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 8000, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2024-06-05", + "last_updated": "2024-06-05", "cost": { - "input": 14.994, - "output": 75.004 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "grok-3-beta", - "name": "Grok 3 Beta", - "display_name": "Grok 3 Beta", + "id": "doubao-seed-1-6-flash-250615", + "name": "Doubao Seed 1.6 Flash", + "display_name": "Doubao Seed 1.6 Flash", "modalities": { "input": [ "text" @@ -12141,8 +11314,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -12150,18 +11323,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 3, - "output": 15 + "input": 0.0374, + "output": 0.374 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Legion-V2.1", - "name": "Llama 3.3 70B Legion V2.1", - "display_name": "Llama 3.3 70B Legion V2.1", + "id": "brave-pro", + "name": "Brave (Pro)", + "display_name": "Brave (Pro)", "modalities": { "input": [ "text" @@ -12171,8 +11344,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -12180,18 +11353,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 5, + "output": 5 }, "type": "chat" }, { - "id": "sonar", - "name": "Perplexity Simple", - "display_name": "Perplexity Simple", + "id": "Llama-3.3-70B-Sapphira-0.1", + "name": "Llama 3.3 70B Sapphira 0.1", + "display_name": "Llama 3.3 70B Sapphira 0.1", "modalities": { "input": [ "text" @@ -12201,8 +11374,8 @@ ] }, "limit": { - "context": 127000, - "output": 128000 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -12210,45 +11383,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.003, - "output": 1.003 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "z-image-turbo", - "name": "Z Image Turbo", - "display_name": "Z Image Turbo", + "id": "Llama-3.3-70B-Incandescent-Malevolence", + "name": "Llama 3.3 70B Incandescent Malevolence", + "display_name": "Llama 3.3 70B Incandescent Malevolence", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32768, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-27", - "last_updated": "2025-11-27", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Iceblink-v2", - "name": "GLM 4.5 Air Derestricted Iceblink v2", - "display_name": "GLM 4.5 Air Derestricted Iceblink v2", + "id": "gemini-2.0-pro-reasoner", + "name": "Gemini 2.0 Pro Reasoner", + "display_name": "Gemini 2.0 Pro Reasoner", "modalities": { "input": [ "text" @@ -12258,7 +11434,7 @@ ] }, "limit": { - "context": 158600, + "context": 128000, "output": 65536 }, "tool_call": false, @@ -12267,18 +11443,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.292, + "output": 4.998 }, "type": "chat" }, { - "id": "jamba-large", - "name": "Jamba Large", - "display_name": "Jamba Large", + "id": "hunyuan-turbos-20250226", + "name": "Hunyuan Turbo S", + "display_name": "Hunyuan Turbo S", "modalities": { "input": [ "text" @@ -12288,8 +11464,8 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 24000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -12297,162 +11473,139 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.187, + "output": 0.374 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-reasoner", - "name": "Claude 3.7 Sonnet Reasoner", - "display_name": "Claude 3.7 Sonnet Reasoner", + "id": "doubao-1.5-pro-32k", + "name": "Doubao 1.5 Pro 32k", + "display_name": "Doubao 1.5 Pro 32k", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 32000, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-29", - "last_updated": "2025-03-29", + "release_date": "2025-01-22", + "last_updated": "2025-01-22", "cost": { - "input": 3, - "output": 15 + "input": 0.1343, + "output": 0.3349 }, "type": "chat" }, { - "id": "ernie-4.5-turbo-vl-32k", - "name": "Ernie 4.5 Turbo VL 32k", - "display_name": "Ernie 4.5 Turbo VL 32k", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 128000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.495, - "output": 1.43 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "Mistral-Nemo-12B-Instruct-2407", - "name": "Mistral Nemo 12B Instruct 2407", - "display_name": "Mistral Nemo 12B Instruct 2407", + "id": "Llama-3.3-70B-MS-Nevoria", + "name": "Llama 3.3 70B MS Nevoria", + "display_name": "Llama 3.3 70B MS Nevoria", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 32768, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "doubao-seed-1-6-flash-250615", - "name": "Doubao Seed 1.6 Flash", - "display_name": "Doubao Seed 1.6 Flash", + "id": "ernie-x1-32k", + "name": "Ernie X1 32k", + "display_name": "Ernie X1 32k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 32000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.0374, - "output": 0.374 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "qwq-32b", - "name": "Qwen: QwQ 32B", - "display_name": "Qwen: QwQ 32B", + "id": "auto-model", + "name": "Auto model", + "display_name": "Auto model", "modalities": { "input": [ "text" @@ -12462,82 +11615,73 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 1000000 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.25599999, - "output": 0.30499999 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Strawberrylemonade-v1.2", - "name": "Llama 3.3 70B StrawberryLemonade v1.2", - "display_name": "Llama 3.3 70B StrawberryLemonade v1.2", + "id": "azure-gpt-4o-mini", + "name": "Azure gpt-4o-mini", + "display_name": "Azure gpt-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.1496, + "output": 0.595 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview", - "display_name": "Gemini 2.5 Flash Preview", + "id": "claude-3-7-sonnet-thinking:128000", + "name": "Claude 3.7 Sonnet Thinking (128K)", + "display_name": "Claude 3.7 Sonnet Thinking (128K)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -12548,34 +11692,34 @@ "default_enabled": true, "mode": "budget", "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, + "min": 1024, "unit": "tokens" }, - "summaries": true, - "visibility": "summary", + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "ernie-x1-turbo-32k", - "name": "Ernie X1 Turbo 32k", - "display_name": "Ernie X1 Turbo 32k", + "id": "claude-opus-4-thinking:8192", + "name": "Claude 4 Opus Thinking (8K)", + "display_name": "Claude 4 Opus Thinking (8K)", "modalities": { "input": [ "text", @@ -12587,62 +11731,34 @@ ] }, "limit": { - "context": 32000, - "output": 16384 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", - "cost": { - "input": 0.165, - "output": 0.66 - }, - "type": "chat" - }, - { - "id": "deepseek-math-v2", - "name": "DeepSeek Math V2", - "display_name": "DeepSeek Math V2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.6, - "output": 2.2 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Electranova-v1.0", - "name": "Llama 3.3 70B Electranova v1.0", - "display_name": "Llama 3.3 70B Electranova v1.0", + "id": "glm-z1-air", + "name": "GLM Z1 Air", + "display_name": "GLM Z1 Air", "modalities": { "input": [ "text" @@ -12652,85 +11768,80 @@ ] }, "limit": { - "context": 32768, + "context": 32000, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.07, + "output": 0.07 }, "type": "chat" }, { - "id": "Llama-3.3-70B-ArliAI-RPMax-v2", - "name": "Llama 3.3 70B ArliAI RPMax v2", - "display_name": "Llama 3.3 70B ArliAI RPMax v2", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 16000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "qwen-image", - "name": "Qwen Image", - "display_name": "Qwen Image", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "type": "imageGeneration" - }, - { - "id": "Llama-3.3-70B-Cu-Mai-R1", - "name": "Llama 3.3 70B Cu Mai R1", - "display_name": "Llama 3.3 70B Cu Mai R1", + "id": "Gemma-3-27B-Big-Tiger-v3", + "name": "Gemma 3 27B Big Tiger v3", + "display_name": "Gemma 3 27B Big Tiger v3", "modalities": { "input": [ "text" @@ -12749,8 +11860,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { "input": 0.306, "output": 0.306 @@ -12758,12 +11869,13 @@ "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Iceblink", - "name": "GLM 4.5 Air Derestricted Iceblink", - "display_name": "GLM 4.5 Air Derestricted Iceblink", + "id": "kimi-k2-instruct-fast", + "name": "Kimi K2 0711 Fast", + "display_name": "Kimi K2 0711 Fast", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" @@ -12771,56 +11883,79 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Bigger-Body", - "name": "Llama 3.3 70B Bigger Body", - "display_name": "Llama 3.3 70B Bigger Body", + "id": "gemini-2.5-flash-nothinking", + "name": "Gemini 2.5 Flash (No Thinking)", + "display_name": "Gemini 2.5 Flash (No Thinking)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1048756, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "hunyuan-turbos-20250226", - "name": "Hunyuan Turbo S", - "display_name": "Hunyuan Turbo S", + "id": "phi-4-mini-instruct", + "name": "Phi 4 Mini", + "display_name": "Phi 4 Mini", "modalities": { "input": [ "text" @@ -12830,8 +11965,8 @@ ] }, "limit": { - "context": 24000, - "output": 8192 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -12839,18 +11974,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.187, - "output": 0.374 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview (09/2025)", - "display_name": "Gemini 2.5 Flash Preview (09/2025)", + "id": "gemini-2.5-flash-lite-preview-09-2025-thinking", + "name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", + "display_name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", "modalities": { "input": [ "text", @@ -12868,19 +12003,18 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "budget", "budget": { "default": -1, - "min": 0, + "min": 512, "max": 24576, "auto": -1, - "off": 0, "unit": "tokens" }, "summaries": true, @@ -12895,45 +12029,54 @@ "release_date": "2025-09-25", "last_updated": "2025-09-25", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "GLM-4.6-Derestricted-v5", - "name": "GLM 4.6 Derestricted v5", - "display_name": "GLM 4.6 Derestricted v5", + "id": "claude-sonnet-4-thinking:64000", + "name": "Claude 4 Sonnet Thinking (64K)", + "display_name": "Claude 4 Sonnet Thinking (64K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.4, - "output": 1.5 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "glm-4-plus", - "name": "GLM-4 Plus", - "display_name": "GLM-4 Plus", + "id": "GLM-4.5-Air-Derestricted-Iceblink-ReExtract", + "name": "GLM 4.5 Air Derestricted Iceblink ReExtract", + "display_name": "GLM 4.5 Air Derestricted Iceblink ReExtract", "modalities": { "input": [ "text" @@ -12943,8 +12086,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 98304 }, "tool_call": false, "reasoning": { @@ -12952,48 +12095,46 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 7.497, - "output": 7.497 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Gemma-3-27B-Big-Tiger-v3", - "name": "Gemma 3 27B Big Tiger v3", - "display_name": "Gemma 3 27B Big Tiger v3", + "id": "qwen-image", + "name": "Qwen Image", + "display_name": "Qwen Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", - "cost": { - "input": 0.306, - "output": 0.306 - }, - "type": "chat" + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "type": "imageGeneration" }, { - "id": "brave-research", - "name": "Brave (Research)", - "display_name": "Brave (Research)", + "id": "doubao-seed-1-6-thinking-250615", + "name": "Doubao Seed 1.6 Thinking", + "display_name": "Doubao Seed 1.6 Thinking", "modalities": { "input": [ "text" @@ -13003,7 +12144,7 @@ ] }, "limit": { - "context": 16384, + "context": 256000, "output": 16384 }, "tool_call": false, @@ -13012,45 +12153,54 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 5, - "output": 5 + "input": 0.204, + "output": 2.04 }, "type": "chat" }, { - "id": "hidream", - "name": "Hidream", - "display_name": "Hidream", + "id": "MiniMax-M2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 131072 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "release_date": "2025-10-25", + "last_updated": "2025-10-25", + "cost": { + "input": 0.17, + "output": 1.53 + }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max 2026-01-23", - "display_name": "Qwen3 Max 2026-01-23", + "id": "Llama-3.3-70B-The-Omega-Directive-Unslop-v2.0", + "name": "Llama 3.3 70B Omega Directive Unslop v2.0", + "display_name": "Llama 3.3 70B Omega Directive Unslop v2.0", "modalities": { "input": [ "text" @@ -13060,70 +12210,57 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.2002, - "output": 6.001 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude 4.1 Opus", - "display_name": "Claude 4.1 Opus", + "id": "Llama-3.3-70B-Sapphira-0.2", + "name": "Llama 3.3 70B Sapphira 0.2", + "display_name": "Llama 3.3 70B Sapphira 0.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "claude-sonnet-4-20250514", + "name": "Claude 4 Sonnet", + "display_name": "Claude 4 Sonnet", "modalities": { "input": [ "text", @@ -13144,21 +12281,23 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1, - "output": 5 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "claude-sonnet-4-thinking", + "name": "Claude 4 Sonnet Thinking", + "display_name": "Claude 4 Sonnet Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -13166,26 +12305,33 @@ }, "limit": { "context": 1000000, - "output": 131072 + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.1394, - "output": 1.3328 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "gemini-2.5-flash-nothinking", - "name": "Gemini 2.5 Flash (No Thinking)", - "display_name": "Gemini 2.5 Flash (No Thinking)", + "id": "gemini-2.5-flash-preview-09-2025-thinking", + "name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", + "display_name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", "modalities": { "input": [ "text", @@ -13200,7 +12346,7 @@ "context": 1048756, "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -13227,8 +12373,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { "input": 0.3, "output": 2.5 @@ -13236,9 +12382,9 @@ "type": "chat" }, { - "id": "exa-research-pro", - "name": "Exa (Research Pro)", - "display_name": "Exa (Research Pro)", + "id": "ernie-x1-32k-preview", + "name": "Ernie X1 32k", + "display_name": "Ernie X1 32k", "modalities": { "input": [ "text" @@ -13248,7 +12394,7 @@ ] }, "limit": { - "context": 16384, + "context": 32000, "output": 16384 }, "tool_call": false, @@ -13257,100 +12403,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", - "cost": { - "input": 2.5, - "output": 2.5 - }, - "type": "chat" - }, - { - "id": "grok-3-fast-beta", - "name": "Grok 3 Fast Beta", - "display_name": "Grok 3 Fast Beta", - "modalities": { - "input": [ - "text", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2025-04-03", + "last_updated": "2025-04-03", "cost": { - "input": 5, - "output": 25 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101:thinking", - "name": "Claude 4.5 Opus Thinking", - "display_name": "Claude 4.5 Opus Thinking", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 200000, - "output": 32000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", - "cost": { - "input": 4.998, - "output": 25.007 - }, - "type": "chat" - }, - { - "id": "gemini-2.5-pro-exp-03-25", - "name": "Gemini 2.5 Pro Experimental 0325", - "display_name": "Gemini 2.5 Pro Experimental 0325", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 995904, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -13360,41 +12435,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 2.5, - "output": 10 + "input": 0.3995, + "output": 1.2002 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-thinking", - "name": "Claude 3.7 Sonnet Thinking", - "display_name": "Claude 3.7 Sonnet Thinking", + "id": "v0-1.0-md", + "name": "v0 1.0 MD", + "display_name": "v0 1.0 MD", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -13402,115 +12467,76 @@ }, "limit": { "context": 200000, - "output": 16000 + "output": 64000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-07-04", + "last_updated": "2025-07-04", "cost": { - "input": 2.992, - "output": 14.994 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:8192", - "name": "Claude 4 Opus Thinking (8K)", - "display_name": "Claude 4 Opus Thinking (8K)", + "id": "Magistral-Small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.4, + "output": 1.4 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking:1024", - "name": "Claude 4 Sonnet Thinking (1K)", - "display_name": "Claude 4 Sonnet Thinking (1K)", + "id": "sonar-pro", + "name": "Perplexity Pro", + "display_name": "Perplexity Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 128000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { "input": 2.992, "output": 14.994 @@ -13518,9 +12544,9 @@ "type": "chat" }, { - "id": "Llama-3.3-70B-Magnum-v4-SE-Cirrus-x1-SLERP", - "name": "Llama 3.3 70B Magnum v4 SE Cirrus x1 SLERP", - "display_name": "Llama 3.3 70B Magnum v4 SE Cirrus x1 SLERP", + "id": "Qwen2.5-32B-EVA-v0.2", + "name": "Qwen 2.5 32b EVA", + "display_name": "Qwen 2.5 32b EVA", "modalities": { "input": [ "text" @@ -13530,8 +12556,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 24576, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -13539,18 +12565,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.493, + "output": 0.493 }, "type": "chat" }, { - "id": "step-r1-v-mini", - "name": "Step R1 V Mini", - "display_name": "Step R1 V Mini", + "id": "exa-answer", + "name": "Exa (Answer)", + "display_name": "Exa (Answer)", "modalities": { "input": [ "text" @@ -13560,8 +12586,8 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -13569,18 +12595,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-08", - "last_updated": "2025-04-08", + "release_date": "2025-06-04", + "last_updated": "2025-06-04", "cost": { "input": 2.5, - "output": 11 + "output": 2.5 }, "type": "chat" }, { - "id": "ernie-x1-32k-preview", - "name": "Ernie X1 32k", - "display_name": "Ernie X1 32k", + "id": "doubao-seed-1-6-250615", + "name": "Doubao Seed 1.6", + "display_name": "Doubao Seed 1.6", "modalities": { "input": [ "text" @@ -13590,7 +12616,7 @@ ] }, "limit": { - "context": 32000, + "context": 256000, "output": 16384 }, "tool_call": false, @@ -13599,18 +12625,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 0.33, - "output": 1.32 + "input": 0.204, + "output": 0.51 }, "type": "chat" }, { - "id": "Llama-3.3-70B-StrawberryLemonade-v1.0", - "name": "Llama 3.3 70B StrawberryLemonade v1.0", - "display_name": "Llama 3.3 70B StrawberryLemonade v1.0", + "id": "Llama-3.3-70B-Forgotten-Safeword-3.6", + "name": "Llama 3.3 70B Forgotten Safeword 3.6", + "display_name": "Llama 3.3 70B Forgotten Safeword 3.6", "modalities": { "input": [ "text" @@ -13638,9 +12664,9 @@ "type": "chat" }, { - "id": "KAT-Coder-Exp-72B-1010", - "name": "KAT Coder Exp 72B 1010", - "display_name": "KAT Coder Exp 72B 1010", + "id": "KAT-Coder-Air-V1", + "name": "KAT Coder Air V1", + "display_name": "KAT Coder Air V1", "modalities": { "input": [ "text" @@ -13668,131 +12694,99 @@ "type": "chat" }, { - "id": "gemini-2.5-pro-preview-03-25", - "name": "Gemini 2.5 Pro Preview 0325", - "display_name": "Gemini 2.5 Pro Preview 0325", + "id": "phi-4-multimodal-instruct", + "name": "Phi 4 Multimodal", + "display_name": "Phi 4 Multimodal", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 2.5, - "output": 10 + "input": 0.07, + "output": 0.11 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:1024", - "name": "Claude 4 Opus Thinking (1K)", - "display_name": "Claude 4 Opus Thinking (1K)", + "id": "soob3123/GrayLine-Qwen3-8B", + "name": "Grayline Qwen3 8B", + "display_name": "Grayline Qwen3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16384, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude 4 Sonnet", - "display_name": "Claude 4 Sonnet", + "id": "soob3123/Veiled-Calla-12B", + "name": "Veiled Calla 12B", + "display_name": "Veiled Calla 12B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-04-13", + "last_updated": "2025-04-13", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Progenitor-V3.3", - "name": "Llama 3.3 70B Progenitor V3.3", - "display_name": "Llama 3.3 70B Progenitor V3.3", + "id": "soob3123/amoral-gemma3-27B-v2", + "name": "Amoral Gemma3 27B v2", + "display_name": "Amoral Gemma3 27B v2", "modalities": { "input": [ "text" @@ -13803,7 +12797,7 @@ }, "limit": { "context": 32768, - "output": 16384 + "output": 8192 }, "tool_call": false, "reasoning": { @@ -13811,18 +12805,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2025-05-23", + "last_updated": "2025-05-23", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "Qwen2.5-32B-EVA-v0.2", - "name": "Qwen 2.5 32b EVA", - "display_name": "Qwen 2.5 32b EVA", + "id": "EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2", + "name": "EVA-Qwen2.5-72B-v0.2", + "display_name": "EVA-Qwen2.5-72B-v0.2", "modalities": { "input": [ "text" @@ -13832,7 +12826,7 @@ ] }, "limit": { - "context": 24576, + "context": 16384, "output": 8192 }, "tool_call": false, @@ -13841,18 +12835,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.493, - "output": 0.493 + "input": 0.7989999999999999, + "output": 0.7989999999999999 }, "type": "chat" }, { - "id": "brave-pro", - "name": "Brave (Pro)", - "display_name": "Brave (Pro)", + "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1", + "name": "EVA-LLaMA-3.33-70B-v0.1", + "display_name": "EVA-LLaMA-3.33-70B-v0.1", "modalities": { "input": [ "text" @@ -13862,8 +12856,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -13871,18 +12865,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 5, - "output": 5 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "step-2-16k-exp", - "name": "Step-2 16k Exp", - "display_name": "Step-2 16k Exp", + "id": "EVA-UNIT-01/EVA-Qwen2.5-32B-v0.2", + "name": "EVA-Qwen2.5-32B-v0.2", + "display_name": "EVA-Qwen2.5-32B-v0.2", "modalities": { "input": [ "text" @@ -13892,7 +12886,7 @@ ] }, "limit": { - "context": 16000, + "context": 16384, "output": 8192 }, "tool_call": false, @@ -13901,18 +12895,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-05", - "last_updated": "2024-07-05", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 7.004, - "output": 19.992 + "input": 0.7989999999999999, + "output": 0.7989999999999999 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Fallen-R1-v1", - "name": "Llama 3.3 70B Fallen R1 v1", - "display_name": "Llama 3.3 70B Fallen R1 v1", + "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0", + "name": "EVA Llama 3.33 70B", + "display_name": "EVA Llama 3.33 70B", "modalities": { "input": [ "text" @@ -13922,7 +12916,7 @@ ] }, "limit": { - "context": 32768, + "context": 16384, "output": 16384 }, "tool_call": false, @@ -13931,68 +12925,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking", - "name": "Claude 4 Sonnet Thinking", - "display_name": "Claude 4 Sonnet Thinking", + "id": "Gryphe/MythoMax-L2-13b", + "name": "MythoMax 13B", + "display_name": "MythoMax 13B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", - "cost": { - "input": 2.992, - "output": 14.994 - }, - "type": "chat" - }, - { - "id": "doubao-1.5-pro-256k", - "name": "Doubao 1.5 Pro 256k", - "display_name": "Doubao 1.5 Pro 256k", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 16384 + "context": 4000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -14000,22 +12955,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.799, - "output": 1.445 + "input": 0.1003, + "output": 0.1003 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "undi95/remm-slerp-l2-13b", + "name": "ReMM SLERP 13B", + "display_name": "ReMM SLERP 13B", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -14023,48 +12977,27 @@ ] }, "limit": { - "context": 200000, - "output": 16000 + "context": 6144, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.7989999999999999, + "output": 1.2069999999999999 }, "type": "chat" }, { - "id": "learnlm-1.5-pro-experimental", - "name": "Gemini LearnLM Experimental", - "display_name": "Gemini LearnLM Experimental", + "id": "nothingiisreal/L3.1-70B-Celeste-V0.1-BF16", + "name": "Llama 3.1 70B Celeste v0.1", + "display_name": "Llama 3.1 70B Celeste v0.1", "modalities": { "input": [ "text" @@ -14074,8 +13007,8 @@ ] }, "limit": { - "context": 32767, - "output": 8192 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -14083,18 +13016,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 3.502, - "output": 10.506 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "deepseek-ai/deepseek-v3.2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -14104,54 +13037,57 @@ ] }, "limit": { - "context": 128000, + "context": 163840, "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "chroma", - "name": "Chroma", - "display_name": "Chroma", + "id": "deepseek-ai/DeepSeek-V3.1:thinking", + "name": "DeepSeek V3.1 Thinking", + "display_name": "DeepSeek V3.1 Thinking", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.2, + "output": 0.7 + }, "type": "chat" }, { - "id": "Llama-3.3-70B-Predatorial-Extasy", - "name": "Llama 3.3 70B Predatorial Extasy", - "display_name": "Llama 3.3 70B Predatorial Extasy", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -14161,27 +13097,39 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 163840 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Aurora-Borealis", - "name": "Llama 3.3 70B Aurora Borealis", - "display_name": "Llama 3.3 70B Aurora Borealis", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -14191,57 +13139,58 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-02", + "last_updated": "2025-08-02", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "Llama-3.3-70B-ArliAI-RPMax-v3", - "name": "Llama 3.3 70B ArliAI RPMax v3", - "display_name": "Llama 3.3 70B ArliAI RPMax v3", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "venice-uncensored", - "name": "Venice Uncensored", - "display_name": "Venice Uncensored", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus:thinking", + "name": "DeepSeek V3.1 Terminus (Thinking)", + "display_name": "DeepSeek V3.1 Terminus (Thinking)", "modalities": { "input": [ "text" @@ -14252,57 +13201,57 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "step-3", - "name": "Step-3", - "display_name": "Step-3", + "id": "deepseek-ai/deepseek-v3.2-exp-thinking", + "name": "DeepSeek V3.2 Exp Thinking", + "display_name": "DeepSeek V3.2 Exp Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 163840, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.2499, - "output": 0.6494 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "Llama-3.3-70B-The-Omega-Directive-Unslop-v2.0", - "name": "Llama 3.3 70B Omega Directive Unslop v2.0", - "display_name": "Llama 3.3 70B Omega Directive Unslop v2.0", + "id": "cohere/command-r-plus-08-2024", + "name": "Cohere: Command R+", + "display_name": "Cohere: Command R+", "modalities": { "input": [ "text" @@ -14312,27 +13261,27 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2.856, + "output": 14.246 }, "type": "chat" }, { - "id": "auto-model", - "name": "Auto model", - "display_name": "Auto model", + "id": "cohere/command-r", + "name": "Cohere: Command R", + "display_name": "Cohere: Command R", "modalities": { "input": [ "text" @@ -14342,8 +13291,8 @@ ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -14351,22 +13300,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2024-03-11", + "last_updated": "2024-03-11", "cost": { - "input": 0, - "output": 0 + "input": 0.476, + "output": 1.428 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking:32768", - "name": "Claude 4.1 Opus Thinking (32K)", - "display_name": "Claude 4.1 Opus Thinking (32K)", + "id": "raifle/sorcererlm-8x22b", + "name": "SorcererLM 8x22B", + "display_name": "SorcererLM 8x22B", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -14374,34 +13322,27 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16000, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 14.994, - "output": 75.004 + "input": 4.505, + "output": 4.505 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Shakudo", - "name": "Llama 3.3 70B Shakudo", - "display_name": "Llama 3.3 70B Shakudo", + "id": "inflatebot/MN-12B-Mag-Mell-R1", + "name": "Mag Mell R1", + "display_name": "Mag Mell R1", "modalities": { "input": [ "text" @@ -14411,8 +13352,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -14420,18 +13361,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "Baichuan4-Air", - "name": "Baichuan 4 Air", - "display_name": "Baichuan 4 Air", + "id": "TEE/qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507 TEE", + "display_name": "Qwen3 30B A3B Instruct 2507 TEE", "modalities": { "input": [ "text" @@ -14441,7 +13382,7 @@ ] }, "limit": { - "context": 32768, + "context": 262000, "output": 32768 }, "tool_call": false, @@ -14450,49 +13391,54 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.157, - "output": 0.157 + "input": 0.15, + "output": 0.44999999999999996 }, "type": "chat" }, { - "id": "kimi-thinking-preview", - "name": "Kimi Thinking Preview", - "display_name": "Kimi Thinking Preview", + "id": "TEE/minimax-m2.1", + "name": "MiniMax M2.1 TEE", + "display_name": "MiniMax M2.1 TEE", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 31.46, - "output": 31.46 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "TEE/kimi-k2.5", + "name": "Kimi K2.5 TEE", + "display_name": "Kimi K2.5 TEE", "modalities": { "input": [ "text" @@ -14502,8 +13448,8 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 128000, + "output": 65535 }, "tool_call": false, "reasoning": { @@ -14522,87 +13468,90 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.04998, - "output": 0.2006 + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Mhnnn-x1", - "name": "Llama 3.3 70B Mhnnn x1", - "display_name": "Llama 3.3 70B Mhnnn x1", + "id": "TEE/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B TEE", + "display_name": "Qwen2.5 VL 72B TEE", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 65536, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:32768", - "name": "Claude 4 Opus Thinking (32K)", - "display_name": "Claude 4 Opus Thinking (32K)", + "id": "TEE/deepseek-r1-0528", + "name": "DeepSeek R1 0528 TEE", + "display_name": "DeepSeek R1 0528 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 14.994, - "output": 75.004 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Argunaut-1-SFT", - "name": "Llama 3.3 70B Argunaut 1 SFT", - "display_name": "Llama 3.3 70B Argunaut 1 SFT", + "id": "TEE/deepseek-v3.2", + "name": "DeepSeek V3.2 TEE", + "display_name": "DeepSeek V3.2 TEE", "modalities": { "input": [ "text" @@ -14612,117 +13561,63 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 164000, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0.306, - "output": 0.306 - }, - "type": "chat" - }, - { - "id": "claude-opus-4-1-thinking:1024", - "name": "Claude 4.1 Opus Thinking (1K)", - "display_name": "Claude 4.1 Opus Thinking (1K)", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 32000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.5, + "output": 1 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "TEE/kimi-k2.5-thinking", + "name": "Kimi K2.5 Thinking TEE", + "display_name": "Kimi K2.5 Thinking TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 128000, + "output": 65535 }, "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "phi-4-multimodal-instruct", - "name": "Phi 4 Multimodal", - "display_name": "Phi 4 Multimodal", + "id": "TEE/gemma-3-27b-it", + "name": "Gemma 3 27B TEE", + "display_name": "Gemma 3 27B TEE", "modalities": { "input": [ "text" @@ -14732,8 +13627,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -14741,18 +13636,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.07, - "output": 0.11 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "doubao-seed-2-0-code-preview-260215", - "name": "Doubao Seed 2.0 Code Preview", - "display_name": "Doubao Seed 2.0 Code Preview", + "id": "TEE/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B TEE", + "display_name": "Qwen3.5 397B A17B TEE", "modalities": { "input": [ "text" @@ -14762,27 +13657,38 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 258048, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2026-02-28", + "last_updated": "2026-02-28", "cost": { - "input": 0.782, - "output": 3.893 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "deepseek-reasoner-cheaper", - "name": "Deepseek R1 Cheaper", - "display_name": "Deepseek R1 Cheaper", + "id": "TEE/glm-4.7-flash", + "name": "GLM 4.7 Flash TEE", + "display_name": "GLM 4.7 Flash TEE", "modalities": { "input": [ "text" @@ -14792,27 +13698,32 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 203000, + "output": 65535 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.4, - "output": 1.7 + "input": 0.15, + "output": 0.5 }, "type": "chat" }, { - "id": "exa-answer", - "name": "Exa (Answer)", - "display_name": "Exa (Answer)", + "id": "TEE/glm-4.6", + "name": "GLM 4.6 TEE", + "display_name": "GLM 4.6 TEE", "modalities": { "input": [ "text" @@ -14822,27 +13733,32 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 203000, + "output": 65535 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 2.5, - "output": 2.5 + "input": 0.75, + "output": 2 }, "type": "chat" }, { - "id": "v0-1.0-md", - "name": "v0 1.0 MD", - "display_name": "v0 1.0 MD", + "id": "TEE/gpt-oss-20b", + "name": "GPT-OSS 20B TEE", + "display_name": "GPT-OSS 20B TEE", "modalities": { "input": [ "text" @@ -14852,58 +13768,62 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "glm-4.1v-thinking-flash", - "name": "GLM 4.1V Thinking Flash", - "display_name": "GLM 4.1V Thinking Flash", + "id": "TEE/qwen3-coder", + "name": "Qwen3 Coder 480B TEE", + "display_name": "Qwen3 Coder 480B TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 128000, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.3, - "output": 0.3 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "azure-o1", - "name": "Azure o1", - "display_name": "Azure o1", + "id": "TEE/kimi-k2-thinking", + "name": "Kimi K2 Thinking TEE", + "display_name": "Kimi K2 Thinking TEE", "modalities": { "input": [ "text" @@ -14913,27 +13833,38 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 65535 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-17", - "last_updated": "2024-12-17", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 14.994, - "output": 59.993 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted", - "name": "GLM 4.5 Air Derestricted", - "display_name": "GLM 4.5 Air Derestricted", + "id": "TEE/deepseek-v3.1", + "name": "DeepSeek V3.1 TEE", + "display_name": "DeepSeek V3.1 TEE", "modalities": { "input": [ "text" @@ -14943,8 +13874,8 @@ ] }, "limit": { - "context": 202600, - "output": 98304 + "context": 164000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -14952,18 +13883,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1, + "output": 2.5 }, "type": "chat" }, { - "id": "azure-o3-mini", - "name": "Azure o3-mini", - "display_name": "Azure o3-mini", + "id": "TEE/llama3-3-70b", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -14973,8 +13904,8 @@ ] }, "limit": { - "context": 200000, - "output": 65536 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -14982,18 +13913,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 1.088, - "output": 4.3996 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "TEE/glm-4.7", + "name": "GLM 4.7 TEE", + "display_name": "GLM 4.7 TEE", "modalities": { "input": [ "text" @@ -15003,8 +13934,8 @@ ] }, "limit": { - "context": 245800, - "output": 65536 + "context": 131000, + "output": 65535 }, "tool_call": false, "reasoning": { @@ -15023,18 +13954,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-21", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 1.3, - "output": 7.8 + "input": 0.85, + "output": 3.3 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Sapphira-0.2", - "name": "Llama 3.3 70B Sapphira 0.2", - "display_name": "Llama 3.3 70B Sapphira 0.2", + "id": "TEE/gpt-oss-120b", + "name": "GPT-OSS 120B TEE", + "display_name": "GPT-OSS 120B TEE", "modalities": { "input": [ "text" @@ -15044,57 +13975,32 @@ ] }, "limit": { - "context": 32768, + "context": 131072, "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0.306, - "output": 0.306 - }, - "type": "chat" - }, - { - "id": "Llama-3.3-70B-Anthrobomination", - "name": "Llama 3.3 70B Anthrobomination", - "display_name": "Llama 3.3 70B Anthrobomination", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 16384 + "supported": true }, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "QwQ-32B-ArliAI-RpR-v1", - "name": "QwQ 32b Arli V1", - "display_name": "QwQ 32b Arli V1", + "id": "TEE/glm-5", + "name": "GLM 5 TEE", + "display_name": "GLM 5 TEE", "modalities": { "input": [ "text" @@ -15104,8 +14010,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 203000, + "output": 65535 }, "tool_call": false, "reasoning": { @@ -15124,50 +14030,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.2, + "output": 3.5 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude 4 Opus", - "display_name": "Claude 4 Opus", + "id": "mlabonne/NeuralDaredevil-8B-abliterated", + "name": "Neural Daredevil 8B abliterated", + "display_name": "Neural Daredevil 8B abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.44, + "output": 0.44 }, "type": "chat" }, { - "id": "yi-lightning", - "name": "Yi Lightning", - "display_name": "Yi Lightning", + "id": "MarinaraSpaghetti/NemoMix-Unleashed-12B", + "name": "NemoMix 12B Unleashed", + "display_name": "NemoMix 12B Unleashed", "modalities": { "input": [ "text" @@ -15177,8 +14081,8 @@ ] }, "limit": { - "context": 12000, - "output": 4096 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -15186,18 +14090,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-10-16", - "last_updated": "2024-10-16", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Electra-R1", - "name": "Llama 3.3 70B Electra R1", - "display_name": "Llama 3.3 70B Electra R1", + "id": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", + "name": "Tongyi DeepResearch 30B A3B", + "display_name": "Tongyi DeepResearch 30B A3B", "modalities": { "input": [ "text" @@ -15207,8 +14111,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -15216,18 +14120,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.08, + "output": 0.24000000000000002 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Forgotten-Abomination-v5.0", - "name": "Llama 3.3 70B Forgotten Abomination v5.0", - "display_name": "Llama 3.3 70B Forgotten Abomination v5.0", + "id": "baseten/Kimi-K2-Instruct-FP4", + "name": "Kimi K2 0711 Instruct FP4", + "display_name": "Kimi K2 0711 Instruct FP4", "modalities": { "input": [ "text" @@ -15237,8 +14141,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -15246,18 +14150,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Cirrus-x1", - "name": "Llama 3.3 70B Cirrus x1", - "display_name": "Llama 3.3 70B Cirrus x1", + "id": "deepcogito/cogito-v1-preview-qwen-32B", + "name": "Cogito v1 Preview Qwen 32B", + "display_name": "Cogito v1 Preview Qwen 32B", "modalities": { "input": [ "text" @@ -15267,8 +14171,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -15276,18 +14180,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-05-10", + "last_updated": "2025-05-10", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.7999999999999998, + "output": 1.7999999999999998 }, "type": "chat" }, { - "id": "grok-3-mini-beta", - "name": "Grok 3 Mini Beta", - "display_name": "Grok 3 Mini Beta", + "id": "deepcogito/cogito-v2.1-671b", + "name": "Cogito v2.1 671B MoE", + "display_name": "Cogito v2.1 671B MoE", "modalities": { "input": [ "text" @@ -15297,96 +14201,101 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.3, - "output": 0.5 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "auto-model-standard", - "name": "Auto model (Standard)", - "display_name": "Auto model (Standard)", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 256000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", - "cost": { - "input": 9.996, - "output": 19.992 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-26", + "last_updated": "2026-01-26", + "cost": { + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929-thinking", - "name": "Claude Sonnet 4.5 Thinking", - "display_name": "Claude Sonnet 4.5 Thinking", + "id": "moonshotai/kimi-k2-thinking-turbo-original", + "name": "Kimi K2 Thinking Turbo Original", + "display_name": "Kimi K2 Thinking Turbo Original", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 256000, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 2.992, - "output": 14.994 + "input": 1.15, + "output": 8 }, "type": "chat" }, { - "id": "v0-1.5-md", - "name": "v0 1.5 MD", - "display_name": "v0 1.5 MD", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -15396,27 +14305,27 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 3, - "output": 15 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "kimi-k2-instruct-fast", - "name": "Kimi K2 0711 Fast", - "display_name": "Kimi K2 0711 Fast", + "id": "moonshotai/Kimi-Dev-72B", + "name": "Kimi Dev 72B", + "display_name": "Kimi Dev 72B", "modalities": { "input": [ "text", @@ -15427,8 +14336,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -15436,48 +14345,50 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.1, - "output": 2 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "glm-4-long", - "name": "GLM-4 Long", - "display_name": "GLM-4 Long", + "id": "moonshotai/kimi-k2.5:thinking", + "name": "Kimi K2.5 Thinking", + "display_name": "Kimi K2.5 Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 4096 + "context": 256000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "jamba-large-1.7", - "name": "Jamba Large 1.7", - "display_name": "Jamba Large 1.7", + "id": "moonshotai/kimi-k2-thinking-original", + "name": "Kimi K2 Thinking Original", + "display_name": "Kimi K2 Thinking Original", "modalities": { "input": [ "text" @@ -15488,30 +14399,30 @@ }, "limit": { "context": 256000, - "output": 4096 + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "qvq-max", - "name": "Qwen: QvQ Max", - "display_name": "Qwen: QvQ Max", + "id": "moonshotai/kimi-k2-instruct-0711", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -15521,24 +14432,24 @@ "context": 128000, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-28", - "last_updated": "2025-03-28", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 1.4, - "output": 5.3 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp-1219", - "name": "Gemini 2.0 Flash Thinking 1219", - "display_name": "Gemini 2.0 Flash Thinking 1219", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -15548,27 +14459,68 @@ ] }, "limit": { - "context": 32767, - "output": 8192 + "context": 256000, + "output": 262144 }, - "tool_call": false, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 262144 + }, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-19", - "last_updated": "2024-12-19", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.1003, - "output": 0.408 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "moonshotai/kimi-k2.6:thinking", + "name": "Kimi K2.6 Thinking", + "display_name": "Kimi K2.6 Thinking", "modalities": { "input": [ "text", @@ -15579,57 +14531,64 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 256000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-21", "cost": { - "input": 0.0748, - "output": 0.306 + "input": 0.53, + "output": 2.73 }, "type": "chat" }, { - "id": "azure-gpt-4-turbo", - "name": "Azure gpt-4-turbo", - "display_name": "Azure gpt-4-turbo", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-21", "cost": { - "input": 9.996, - "output": 30.005 + "input": 0.53, + "output": 2.73 }, "type": "chat" }, { - "id": "Baichuan-M2", - "name": "Baichuan M2 32B Medical", - "display_name": "Baichuan M2 32B Medical", + "id": "Envoid/Llama-3.05-NT-Storybreaker-Ministral-70B", + "name": "Llama 3.05 Storybreaker Ministral 70b", + "display_name": "Llama 3.05 Storybreaker Ministral 70b", "modalities": { "input": [ "text" @@ -15639,8 +14598,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -15648,49 +14607,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 15.73, - "output": 15.73 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long 10M", - "display_name": "Qwen Long 10M", + "id": "Envoid/Llama-3.05-Nemotron-Tenyxchat-Storybreaker-70B", + "name": "Nemotron Tenyxchat Storybreaker 70b", + "display_name": "Nemotron Tenyxchat Storybreaker 70b", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 10000000, + "context": 16384, "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.1003, - "output": 0.408 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Perplexity Reasoning Pro", - "display_name": "Perplexity Reasoning Pro", + "id": "z-ai/glm-4.6:thinking", + "name": "GLM 4.6 Thinking", + "display_name": "GLM 4.6 Thinking", "modalities": { "input": [ "text" @@ -15700,28 +14658,28 @@ ] }, "limit": { - "context": 127000, - "output": 128000 + "context": 200000, + "output": 65535 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2.006, - "output": 7.9985 + "input": 0.4, + "output": 1.5 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20:thinking", - "name": "Gemini 2.5 Flash 0520 Thinking", - "display_name": "Gemini 2.5 Flash 0520 Thinking", + "id": "z-ai/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", @@ -15732,48 +14690,28 @@ ] }, "limit": { - "context": 1048000, - "output": 65536 + "context": 64000, + "output": 96000 }, "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2025-11-22", + "last_updated": "2025-11-22", "cost": { - "input": 0.15, - "output": 3.5 + "input": 0.6, + "output": 1.7999999999999998 }, "type": "chat" }, { - "id": "GLM-4.5-Air-Derestricted-Steam-ReExtract", - "name": "GLM 4.5 Air Derestricted Steam ReExtract", - "display_name": "GLM 4.5 Air Derestricted Steam ReExtract", + "id": "z-ai/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -15783,60 +14721,69 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 65535 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.4, + "output": 1.5 }, "type": "chat" }, { - "id": "Llama-3.3-70B-Dark-Ages-v0.1", - "name": "Llama 3.3 70B Dark Ages v0.1", - "display_name": "Llama 3.3 70B Dark Ages v0.1", + "id": "z-ai/glm-4.5v:thinking", + "name": "GLM 4.5V Thinking", + "display_name": "GLM 4.5V Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 64000, + "output": 96000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-11-22", + "last_updated": "2025-11-22", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.6, + "output": 1.7999999999999998 }, "type": "chat" }, { - "id": "Baichuan4-Turbo", - "name": "Baichuan 4 Turbo", - "display_name": "Baichuan 4 Turbo", + "id": "openai/chatgpt-4o-latest", + "name": "ChatGPT 4o", + "display_name": "ChatGPT 4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -15844,26 +14791,26 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 2.42, - "output": 2.42 + "input": 4.998, + "output": 14.993999999999998 }, "type": "chat" }, { - "id": "doubao-1.5-vision-pro-32k", - "name": "Doubao 1.5 Vision Pro 32k", - "display_name": "Doubao 1.5 Vision Pro 32k", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", @@ -15874,8 +14821,8 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -15883,91 +14830,103 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-01-22", - "last_updated": "2025-01-22", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.459, - "output": 1.377 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-flash", - "name": "Qwen3.6 Flash", - "display_name": "Qwen3.6 Flash", + "id": "openai/gpt-4o-mini-search-preview", + "name": "GPT-4o mini Search Preview", + "display_name": "GPT-4o mini Search Preview", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 991800, - "output": 65536 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.19, - "output": 1.16 + "input": 0.088, + "output": 0.35 }, "type": "chat" }, { - "id": "inflection/inflection-3-pi", - "name": "Inflection 3 Pi", - "display_name": "Inflection 3 Pi", + "id": "openai/gpt-5.2", + "name": "GPT 5.2", + "display_name": "GPT 5.2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 2.499, - "output": 9.996 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "inflection/inflection-3-productivity", - "name": "Inflection 3 Productivity", - "display_name": "Inflection 3 Productivity", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo", + "display_name": "GPT-3.5 Turbo", "modalities": { "input": [ "text" @@ -15977,7 +14936,7 @@ ] }, "limit": { - "context": 8000, + "context": 16385, "output": 4096 }, "tool_call": false, @@ -15986,18 +14945,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", + "release_date": "2022-11-30", + "last_updated": "2024-01-01", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "essentialai/rnj-1-instruct", - "name": "RNJ-1 Instruct 8B", - "display_name": "RNJ-1 Instruct 8B", + "id": "openai/o3-pro-2025-06-10", + "name": "OpenAI o3-pro (2025-06-10)", + "display_name": "OpenAI o3-pro (2025-06-10)", "modalities": { "input": [ "text" @@ -16007,27 +14966,42 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-13", - "last_updated": "2025-12-13", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 0.15, - "output": 0.15 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "LLM360/K2-Think", - "name": "K2-Think", - "display_name": "K2-Think", + "id": "openai/o1-preview", + "name": "OpenAI o1-preview", + "display_name": "OpenAI o1-preview", "modalities": { "input": [ "text" @@ -16042,22 +15016,37 @@ }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.17, - "output": 0.68 + "input": 14.993999999999998, + "output": 59.993 }, "type": "chat" }, { - "id": "TEE/kimi-k2.5", - "name": "Kimi K2.5 TEE", - "display_name": "Kimi K2.5 TEE", + "id": "openai/gpt-5.1-2025-11-13", + "name": "GPT-5.1 (2025-11-13)", + "display_name": "GPT-5.1 (2025-11-13)", "modalities": { "input": [ "text" @@ -16067,291 +15056,339 @@ ] }, "limit": { - "context": 128000, - "output": 65535 + "context": 1000000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.9 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/glm-4.7", - "name": "GLM 4.7 TEE", - "display_name": "GLM 4.7 TEE", + "id": "openai/gpt-5-chat-latest", + "name": "GPT 5 Chat", + "display_name": "GPT 5 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 65535 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.85, - "output": 3.3 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B TEE", - "display_name": "Qwen3.5 397B A17B TEE", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT 5.1 Codex Mini", + "display_name": "GPT 5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 258048, - "output": 65536 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-02-28", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "TEE/glm-5", - "name": "GLM 5 TEE", - "display_name": "GLM 5 TEE", + "id": "openai/gpt-5.2-pro", + "name": "GPT 5.2 Pro", + "display_name": "GPT 5.2 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 203000, - "output": 65535 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 1.2, - "output": 3.5 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "TEE/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B TEE", - "display_name": "Qwen2.5 VL 72B TEE", + "id": "openai/gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.7, - "output": 0.7 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "TEE/minimax-m2.1", - "name": "MiniMax M2.1 TEE", - "display_name": "MiniMax M2.1 TEE", + "id": "openai/gpt-5.1-chat", + "name": "GPT 5.1 Chat", + "display_name": "GPT 5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 400000, + "output": 128000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507 TEE", - "display_name": "Qwen3 30B A3B Instruct 2507 TEE", + "id": "openai/gpt-5.1-chat-latest", + "name": "GPT 5.1 Chat (Latest)", + "display_name": "GPT 5.1 Chat (Latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 32768 + "context": 400000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.15, - "output": 0.44999999999999996 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/deepseek-v3.1", - "name": "DeepSeek V3.1 TEE", - "display_name": "DeepSeek V3.1 TEE", + "id": "openai/gpt-4.1", + "name": "GPT 4.1", + "display_name": "GPT 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 8192 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-09-10", + "last_updated": "2025-09-10", "cost": { - "input": 1, - "output": 2.5 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "TEE/llama3-3-70b", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "openai/gpt-4o-search-preview", + "name": "GPT-4o Search Preview", + "display_name": "GPT-4o Search Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -16365,20 +15402,20 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 2, - "output": 2 + "input": 1.47, + "output": 5.88 }, "type": "chat" }, { - "id": "TEE/glm-4.6", - "name": "GLM 4.6 TEE", - "display_name": "GLM 4.6 TEE", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -16388,12 +15425,13 @@ ] }, "limit": { - "context": 203000, - "output": 65535 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -16402,18 +15440,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.75, - "output": 2 + "input": 0.04, + "output": 0.15 }, "type": "chat" }, { - "id": "TEE/kimi-k2.5-thinking", - "name": "Kimi K2.5 Thinking TEE", - "display_name": "Kimi K2.5 Thinking TEE", + "id": "openai/gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "display_name": "GPT OSS Safeguard 20B", "modalities": { "input": [ "text" @@ -16424,7 +15462,7 @@ }, "limit": { "context": 128000, - "output": 65535 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -16433,83 +15471,96 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 0.3, - "output": 1.9 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "TEE/gemma-3-27b-it", - "name": "Gemma 3 27B TEE", - "display_name": "Gemma 3 27B TEE", + "id": "openai/gpt-5-pro", + "name": "GPT 5 Pro", + "display_name": "GPT 5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", - "cost": { - "input": 0.2, - "output": 0.8 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "TEE/deepseek-v3.2", - "name": "DeepSeek V3.2 TEE", - "display_name": "DeepSeek V3.2 TEE", + "id": "openai/gpt-4.1-mini", + "name": "GPT 4.1 Mini", + "display_name": "GPT 4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 65536 + "context": 1047576, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.5, - "output": 1 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "TEE/gpt-oss-20b", - "name": "GPT-OSS 20B TEE", - "display_name": "GPT-OSS 20B TEE", + "id": "openai/gpt-4-turbo-preview", + "name": "GPT-4 Turbo Preview", + "display_name": "GPT-4 Turbo Preview", "modalities": { "input": [ "text" @@ -16519,176 +15570,216 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2023-11-06", + "last_updated": "2024-01-01", "cost": { - "input": 0.2, - "output": 0.8 + "input": 9.996, + "output": 30.004999999999995 }, "type": "chat" }, { - "id": "TEE/qwen3-coder", - "name": "Qwen3 Coder 480B TEE", - "display_name": "Qwen3 Coder 480B TEE", + "id": "openai/gpt-5.1", + "name": "GPT 5.1", + "display_name": "GPT 5.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1.5, - "output": 2 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "TEE/glm-4.7-flash", - "name": "GLM 4.7 Flash TEE", - "display_name": "GLM 4.7 Flash TEE", + "id": "openai/gpt-5-nano", + "name": "GPT 5 Nano", + "display_name": "GPT 5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 203000, - "output": 65535 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.5 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "TEE/gpt-oss-120b", - "name": "GPT-OSS 120B TEE", - "display_name": "GPT-OSS 120B TEE", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2, - "output": 2 + "input": 0.1496, + "output": 0.595 }, "type": "chat" }, { - "id": "TEE/deepseek-r1-0528", - "name": "DeepSeek R1 0528 TEE", - "display_name": "DeepSeek R1 0528 TEE", + "id": "openai/o1-pro", + "name": "OpenAI o1 Pro", + "display_name": "OpenAI o1 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 100000 }, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 2, - "output": 2 + "input": 150, + "output": 600 }, "type": "chat" }, { - "id": "TEE/kimi-k2-thinking", - "name": "Kimi K2 Thinking TEE", - "display_name": "Kimi K2 Thinking TEE", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -16696,37 +15787,26 @@ }, "limit": { "context": 128000, - "output": 65535 + "output": 4096 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2023-11-06", + "last_updated": "2024-01-01", "cost": { - "input": 2, - "output": 2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "CrucibleLab/L3.3-70B-Loki-V2.0", - "name": "L3.3 70B Loki v2.0", - "display_name": "L3.3 70B Loki v2.0", + "id": "openai/o3-mini-low", + "name": "OpenAI o3-mini (Low)", + "display_name": "OpenAI o3-mini (Low)", "modalities": { "input": [ "text" @@ -16736,59 +15816,87 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2:thinking", - "name": "DeepSeek V3.2 Thinking", - "display_name": "DeepSeek V3.2 Thinking", + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "OpenAI o1", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 200000, + "output": 100000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2024-12-17", + "last_updated": "2024-12-17", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 14.993999999999998, + "output": 59.993 }, "type": "chat" }, { - "id": "deepseek/deepseek-prover-v2-671b", - "name": "DeepSeek Prover v2 671B", - "display_name": "DeepSeek Prover v2 671B", + "id": "openai/o3-mini-high", + "name": "OpenAI o3-mini (High)", + "display_name": "OpenAI o3-mini (High)", "modalities": { "input": [ "text" @@ -16798,30 +15906,46 @@ ] }, "limit": { - "context": 160000, - "output": 16384 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-04-30", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 1, - "output": 2.5 + "input": 0.64, + "output": 2.588 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-speciale", - "name": "DeepSeek V3.2 Speciale", - "display_name": "DeepSeek V3.2 Speciale", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT 5.1 Codex Max", + "display_name": "GPT 5.1 Codex Max", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -16829,69 +15953,94 @@ ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 2.5, + "output": 20 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "openai/o4-mini-high", + "name": "OpenAI o4-mini high", + "display_name": "OpenAI o4-mini high", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "Doctor-Shotgun/MS3.2-24B-Magnum-Diamond", - "name": "MS3.2 24B Magnum Diamond", - "display_name": "MS3.2 24B Magnum Diamond", + "id": "openai/o4-mini-deep-research", + "name": "OpenAI o4-mini Deep Research", + "display_name": "OpenAI o4-mini Deep Research", "modalities": { "input": [ "text" @@ -16901,30 +16050,46 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 200000, + "output": 100000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "NeverSleep/Llama-3-Lumimaid-70B-v0.1", - "name": "Lumimaid 70b", - "display_name": "Lumimaid 70b", + "id": "openai/gpt-4.1-nano", + "name": "GPT 4.1 Nano", + "display_name": "GPT 4.1 Nano", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -16932,8 +16097,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 1047576, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -16941,18 +16106,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2.006, - "output": 2.006 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "NeverSleep/Lumimaid-v0.2-70B", - "name": "Lumimaid v0.2", - "display_name": "Lumimaid v0.2", + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "OpenAI o4-mini", "modalities": { "input": [ "text" @@ -16962,147 +16127,233 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1, - "output": 1.5 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Cu-Mai-R1-70b", - "name": "Llama 3.3 70B Cu Mai", - "display_name": "Llama 3.3 70B Cu Mai", + "id": "openai/gpt-5.1-codex", + "name": "GPT 5.1 Codex", + "display_name": "GPT 5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Nevoria-R1-70b", - "name": "Steelskull Nevoria R1 70b", - "display_name": "Steelskull Nevoria R1 70b", + "id": "openai/gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 128000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Evayale-70B", - "name": "Evayale 70b ", - "display_name": "Evayale 70b ", + "id": "openai/gpt-5.2-codex", + "name": "GPT 5.2 Codex", + "display_name": "GPT 5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Electra-R1-70b", - "name": "Steelskull Electra R1 70b", - "display_name": "Steelskull Electra R1 70b", + "id": "openai/gpt-5-mini", + "name": "GPT 5 Mini", + "display_name": "GPT 5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.69989, - "output": 0.69989 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Nevoria-70b", - "name": "Steelskull Nevoria 70b", - "display_name": "Steelskull Nevoria 70b", + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "OpenAI o3-mini", "modalities": { "input": [ "text" @@ -17112,87 +16363,105 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Evalebis-70b", - "name": "MS Evalebis 70b", - "display_name": "MS Evalebis 70b", + "id": "openai/gpt-5.2-chat", + "name": "GPT 5.2 Chat", + "display_name": "GPT 5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 400000, "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "miromind-ai/mirothinker-v1.5-235b", - "name": "MiroThinker v1.5 235B", - "display_name": "MiroThinker v1.5 235B", + "id": "openai/gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4000 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-07", - "last_updated": "2026-01-07", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 0.3, - "output": 1.2 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "pamanseau/OpenReasoning-Nemotron-32B", - "name": "OpenReasoning Nemotron 32B", - "display_name": "OpenReasoning Nemotron 32B", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -17202,28 +16471,33 @@ ] }, "limit": { - "context": 32768, - "output": 65536 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ "text" @@ -17233,27 +16507,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.045000000000000005, - "output": 0.15 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large", - "name": "Trinity Large", - "display_name": "Trinity Large", + "id": "openai/o3-deep-research", + "name": "OpenAI o3 Deep Research", + "display_name": "OpenAI o3 Deep Research", "modalities": { "input": [ "text" @@ -17263,57 +16552,96 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.25, - "output": 1 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "cognitivecomputations/dolphin-2.9.2-qwen2-72b", - "name": "Dolphin 72b", - "display_name": "Dolphin 72b", + "id": "openai/gpt-5", + "name": "GPT 5", + "display_name": "GPT 5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "deepcogito/cogito-v1-preview-qwen-32B", - "name": "Cogito v1 Preview Qwen 32B", - "display_name": "Cogito v1 Preview Qwen 32B", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -17323,27 +16651,33 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-10", - "last_updated": "2025-05-10", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 1.7999999999999998, - "output": 1.7999999999999998 + "input": 0.3, + "output": 2.55 }, "type": "chat" }, { - "id": "deepcogito/cogito-v2.1-671b", - "name": "Cogito v2.1 671B MoE", - "display_name": "Cogito v2.1 671B MoE", + "id": "zai-org/glm-5:thinking", + "name": "GLM 5 Thinking", + "display_name": "GLM 5 Thinking", "modalities": { "input": [ "text" @@ -17353,28 +16687,28 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 1.25, - "output": 1.25 + "input": 0.3, + "output": 2.55 }, "type": "chat" }, { - "id": "Salesforce/Llama-xLAM-2-70b-fc-r", - "name": "Llama-xLAM-2 70B fc-r", - "display_name": "Llama-xLAM-2 70B fc-r", + "id": "zai-org/glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -17384,27 +16718,33 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-13", - "last_updated": "2025-04-13", + "open_weights": true, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 2.5, - "output": 2.5 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { - "id": "soob3123/Veiled-Calla-12B", - "name": "Veiled Calla 12B", - "display_name": "Veiled Calla 12B", + "id": "zai-org/glm-5.1:thinking", + "name": "GLM 5.1 Thinking", + "display_name": "GLM 5.1 Thinking", "modalities": { "input": [ "text" @@ -17414,27 +16754,28 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-13", - "last_updated": "2025-04-13", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { "input": 0.3, - "output": 0.3 + "output": 2.55 }, "type": "chat" }, { - "id": "soob3123/GrayLine-Qwen3-8B", - "name": "Grayline Qwen3 8B", - "display_name": "Grayline Qwen3 8B", + "id": "zai-org/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -17444,27 +16785,39 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.15, + "output": 0.8 }, "type": "chat" }, { - "id": "soob3123/amoral-gemma3-27B-v2", - "name": "Amoral Gemma3 27B v2", - "display_name": "Amoral Gemma3 27B v2", + "id": "zai-org/glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -17474,30 +16827,43 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-23", - "last_updated": "2025-05-23", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { "input": 0.3, - "output": 0.3 + "output": 2.55 }, "type": "chat" }, { - "id": "nex-agi/deepseek-v3.1-nex-n1", - "name": "DeepSeek V3.1 Nex N1", - "display_name": "DeepSeek V3.1 Nex N1", + "id": "unsloth/gemma-3-27b-it", + "name": "Gemma 3 27B IT", + "display_name": "Gemma 3 27B IT", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" @@ -17505,56 +16871,57 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 96000 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-10", - "last_updated": "2025-12-10", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 0.2992, + "output": 0.2992 }, "type": "chat" }, { - "id": "Envoid/Llama-3.05-NT-Storybreaker-Ministral-70B", - "name": "Llama 3.05 Storybreaker Ministral 70b", - "display_name": "Llama 3.05 Storybreaker Ministral 70b", + "id": "unsloth/gemma-3-12b-it", + "name": "Gemma 3 12B IT", + "display_name": "Gemma 3 12B IT", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 131072 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.272, + "output": 0.272 }, "type": "chat" }, { - "id": "Envoid/Llama-3.05-Nemotron-Tenyxchat-Storybreaker-70B", - "name": "Nemotron Tenyxchat Storybreaker 70b", - "display_name": "Nemotron Tenyxchat Storybreaker 70b", + "id": "unsloth/gemma-3-1b-it", + "name": "Gemma 3 1B IT", + "display_name": "Gemma 3 1B IT", "modalities": { "input": [ "text" @@ -17564,7 +16931,7 @@ ] }, "limit": { - "context": 16384, + "context": 128000, "output": 8192 }, "tool_call": false, @@ -17573,18 +16940,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.1003, + "output": 0.1003 }, "type": "chat" }, { - "id": "anthracite-org/magnum-v4-72b", - "name": "Magnum v4 72B", - "display_name": "Magnum v4 72B", + "id": "unsloth/gemma-3-4b-it", + "name": "Gemma 3 4B IT", + "display_name": "Gemma 3 4B IT", "modalities": { "input": [ "text", @@ -17595,7 +16962,7 @@ ] }, "limit": { - "context": 16384, + "context": 128000, "output": 8192 }, "tool_call": false, @@ -17604,18 +16971,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 2.006, - "output": 2.992 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "anthracite-org/magnum-v2-72b", - "name": "Magnum V2 72B", - "display_name": "Magnum V2 72B", + "id": "aion-labs/aion-1.0", + "name": "Aion 1.0", + "display_name": "Aion 1.0", "modalities": { "input": [ "text" @@ -17625,7 +16992,7 @@ ] }, "limit": { - "context": 16384, + "context": 65536, "output": 8192 }, "tool_call": false, @@ -17634,18 +17001,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", "cost": { - "input": 2.006, - "output": 2.992 + "input": 3.995, + "output": 7.99 }, "type": "chat" }, { - "id": "ReadyArt/MS3.2-The-Omega-Directive-24B-Unslop-v2.0", - "name": "Omega Directive 24B Unslop v2.0", - "display_name": "Omega Directive 24B Unslop v2.0", + "id": "aion-labs/aion-rp-llama-3.1-8b", + "name": "Llama 3.1 8b (uncensored)", + "display_name": "Llama 3.1 8b (uncensored)", "modalities": { "input": [ "text" @@ -17655,8 +17022,8 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 32768, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -17664,18 +17031,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "ReadyArt/The-Omega-Abomination-L-70B-v1.0", - "name": "The Omega Abomination V1", - "display_name": "The Omega Abomination V1", + "id": "aion-labs/aion-1.0-mini", + "name": "Aion 1.0 mini (DeepSeek)", + "display_name": "Aion 1.0 mini (DeepSeek)", "modalities": { "input": [ "text" @@ -17685,8 +17052,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -17694,49 +17061,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 0.7, - "output": 0.95 + "input": 0.7989999999999999, + "output": 1.394 }, "type": "chat" }, { - "id": "undi95/remm-slerp-l2-13b", - "name": "ReMM SLERP 13B", - "display_name": "ReMM SLERP 13B", + "id": "Doctor-Shotgun/MS3.2-24B-Magnum-Diamond", + "name": "MS3.2 24B Magnum Diamond", + "display_name": "MS3.2 24B Magnum Diamond", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 6144, - "output": 4096 + "context": 16384, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.7989999999999999, - "output": 1.2069999999999999 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "MarinaraSpaghetti/NemoMix-Unleashed-12B", - "name": "NemoMix 12B Unleashed", - "display_name": "NemoMix 12B Unleashed", + "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24b Instruct", + "display_name": "Mistral Small 3.2 24b Instruct", "modalities": { "input": [ "text" @@ -17746,8 +17112,8 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 131072 }, "tool_call": false, "reasoning": { @@ -17755,49 +17121,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.2, + "output": 0.4 }, "type": "chat" }, { - "id": "allenai/molmo-2-8b", - "name": "Molmo 2 8B", - "display_name": "Molmo 2 8B", + "id": "LLM360/K2-Think", + "name": "K2-Think", + "display_name": "K2-Think", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 36864, - "output": 36864 + "context": 128000, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "allenai/olmo-3.1-32b-instruct", - "name": "Olmo 3.1 32B Instruct", - "display_name": "Olmo 3.1 32B Instruct", + "id": "Sao10K/L3-8B-Stheno-v3.2", + "name": "Sao10K Stheno 8b", + "display_name": "Sao10K Stheno 8b", "modalities": { "input": [ "text" @@ -17807,7 +17172,7 @@ ] }, "limit": { - "context": 65536, + "context": 16384, "output": 8192 }, "tool_call": false, @@ -17816,18 +17181,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-01-25", - "last_updated": "2026-01-25", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "allenai/olmo-3.1-32b-think", - "name": "Olmo 3.1 32B Think", - "display_name": "Olmo 3.1 32B Think", + "id": "Sao10K/L3.1-70B-Hanami-x1", + "name": "Llama 3.1 70B Hanami", + "display_name": "Llama 3.1 70B Hanami", "modalities": { "input": [ "text" @@ -17837,28 +17202,27 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-25", - "last_updated": "2026-01-25", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, - "output": 0.5 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "allenai/olmo-3-32b-think", - "name": "Olmo 3 32B Think", - "display_name": "Olmo 3 32B Think", + "id": "Sao10K/L3.3-70B-Euryale-v2.3", + "name": "Llama 3.3 70B Euryale", + "display_name": "Llama 3.3 70B Euryale", "modalities": { "input": [ "text" @@ -17868,28 +17232,27 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 20480, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.3, - "output": 0.44999999999999996 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash:thinking", - "name": "Step 3.5 Flash Thinking", - "display_name": "Step 3.5 Flash Thinking", + "id": "Sao10K/L3.1-70B-Euryale-v2.2", + "name": "Llama 3.1 70B Euryale", + "display_name": "Llama 3.1 70B Euryale", "modalities": { "input": [ "text" @@ -17899,28 +17262,27 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 20480, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.306, + "output": 0.357 }, "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "amazon/nova-pro-v1", + "name": "Amazon Nova Pro 1.0", + "display_name": "Amazon Nova Pro 1.0", "modalities": { "input": [ "text" @@ -17930,28 +17292,27 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 300000, + "output": 32000 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.7989999999999999, + "output": 3.1959999999999997 }, "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "amazon/nova-2-lite-v1", + "name": "Amazon Nova 2 Lite", + "display_name": "Amazon Nova 2 Lite", "modalities": { "input": [ "text" @@ -17961,39 +17322,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1000000, + "output": 65535 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.15, - "output": 0.8 + "input": 0.5099999999999999, + "output": 4.25 }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "amazon/nova-lite-v1", + "name": "Amazon Nova Lite 1.0", + "display_name": "Amazon Nova Lite 1.0", "modalities": { "input": [ "text" @@ -18003,39 +17352,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 300000, + "output": 5120 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.0595, + "output": 0.238 }, "type": "chat" }, { - "id": "zai-org/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "amazon/nova-micro-v1", + "name": "Amazon Nova Micro 1.0", + "display_name": "Amazon Nova Micro 1.0", "modalities": { "input": [ "text" @@ -18045,33 +17382,27 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 5120 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.0357, + "output": 0.1394 }, "type": "chat" }, { - "id": "zai-org/glm-5.1:thinking", - "name": "GLM 5.1 Thinking", - "display_name": "GLM 5.1 Thinking", + "id": "CrucibleLab/L3.3-70B-Loki-V2.0", + "name": "L3.3 70B Loki v2.0", + "display_name": "L3.3 70B Loki v2.0", "modalities": { "input": [ "text" @@ -18081,28 +17412,27 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "zai-org/glm-5:thinking", - "name": "GLM 5 Thinking", - "display_name": "GLM 5 Thinking", + "id": "THUDM/GLM-4-32B-0414", + "name": "GLM 4 32B 0414", + "display_name": "GLM 4 32B 0414", "modalities": { "input": [ "text" @@ -18112,28 +17442,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "GLM Z1 32B 0414", + "display_name": "GLM Z1 32B 0414", "modalities": { "input": [ "text" @@ -18143,33 +17472,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.07, - "output": 0.4 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "featherless-ai/Qwerky-72B", - "name": "Qwerky 72B", - "display_name": "Qwerky 72B", + "id": "THUDM/GLM-Z1-Rumination-32B-0414", + "name": "GLM Z1 Rumination 32B 0414", + "display_name": "GLM Z1 Rumination 32B 0414", "modalities": { "input": [ "text" @@ -18180,7 +17503,7 @@ }, "limit": { "context": 32000, - "output": 8192 + "output": 65536 }, "tool_call": false, "reasoning": { @@ -18188,18 +17511,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-20", - "last_updated": "2025-03-20", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "mlabonne/NeuralDaredevil-8B-abliterated", - "name": "Neural Daredevil 8B abliterated", - "display_name": "Neural Daredevil 8B abliterated", + "id": "THUDM/GLM-4-9B-0414", + "name": "GLM 4 9B 0414", + "display_name": "GLM 4 9B 0414", "modalities": { "input": [ "text" @@ -18209,8 +17532,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32000, + "output": 8000 }, "tool_call": false, "reasoning": { @@ -18218,49 +17541,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.44, - "output": 0.44 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "raifle/sorcererlm-8x22b", - "name": "SorcererLM 8x22B", - "display_name": "SorcererLM 8x22B", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "GLM Z1 9B 0414", + "display_name": "GLM Z1 9B 0414", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 8192 + "context": 32000, + "output": 8000 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 4.505, - "output": 4.505 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x7b-instruct-v0.1", - "name": "Mixtral 8x7B", - "display_name": "Mixtral 8x7B", + "id": "inflection/inflection-3-productivity", + "name": "Inflection 3 Productivity", + "display_name": "Inflection 3 Productivity", "modalities": { "input": [ "text" @@ -18270,8 +17592,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -18279,18 +17601,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "cost": { - "input": 0.27, - "output": 0.27 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "mistralai/mistral-saba", - "name": "Mistral Saba", - "display_name": "Mistral Saba", + "id": "inflection/inflection-3-pi", + "name": "Inflection 3 Pi", + "display_name": "Inflection 3 Pi", "modalities": { "input": [ "text" @@ -18300,8 +17622,8 @@ ] }, "limit": { - "context": 32000, - "output": 32768 + "context": 8000, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -18309,49 +17631,54 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "cost": { - "input": 0.1989, - "output": 0.595 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "mistralai/mistral-large-3-675b-instruct-2512", - "name": "Mistral Large 3 675B", - "display_name": "Mistral Large 3 675B", + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 256000 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 1, - "output": 3 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "mistralai/devstral-2-123b-instruct-2512", - "name": "Devstral 2 123B", - "display_name": "Devstral 2 123B", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -18361,27 +17688,33 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.4, - "output": 1.4 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Codestral 2508", - "display_name": "Codestral 2508", + "id": "minimax/minimax-m2-her", + "name": "MiniMax M2-her", + "display_name": "MiniMax M2-her", "modalities": { "input": [ "text" @@ -18391,8 +17724,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 65532, + "output": 2048 }, "tool_call": false, "reasoning": { @@ -18400,79 +17733,91 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "release_date": "2026-01-24", + "last_updated": "2026-01-24", "cost": { - "input": 0.3, - "output": 0.8999999999999999 + "input": 0.30200000000000005, + "output": 1.2069999999999999 }, "type": "chat" }, { - "id": "mistralai/ministral-14b-instruct-2512", - "name": "Ministral 3 14B", - "display_name": "Ministral 3 14B", + "id": "minimax/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "mistralai/mistral-tiny", - "name": "Mistral Tiny", - "display_name": "Mistral Tiny", + "id": "minimax/minimax-01", + "name": "MiniMax 01", + "display_name": "MiniMax 01", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 1000192, + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2024-01-01", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0.25499999999999995, - "output": 0.25499999999999995 + "input": 0.1394, + "output": 1.1219999999999999 }, "type": "chat" }, { - "id": "mistralai/ministral-8b-2512", - "name": "Ministral 8B", - "display_name": "Ministral 8B", + "id": "Tongyi-Zhiwen/QwenLong-L1-32B", + "name": "QwenLong L1 32B", + "display_name": "QwenLong L1 32B", "modalities": { "input": [ "text" @@ -18482,8 +17827,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 40960 }, "tool_call": false, "reasoning": { @@ -18491,78 +17836,82 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.13999999999999999, + "output": 0.6 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x22b-instruct-v0.1", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "x-ai/grok-4-07-09", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 256000, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.8999999999999999, - "output": 0.8999999999999999 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3.1", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "x-ai/grok-4-fast:thinking", + "name": "Grok 4 Fast Thinking", + "display_name": "Grok 4 Fast Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 2000000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.4, - "output": 2 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/ministral-3b-2512", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "x-ai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -18572,57 +17921,65 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "x-ai/grok-4.1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 2000000, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.1003, - "output": 0.1207 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "x-ai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ "text", @@ -18633,58 +17990,60 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 2000000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-09-20", + "last_updated": "2025-09-20", "cost": { - "input": 0.4, - "output": 2 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct", - "name": "Mistral 7B Instruct", - "display_name": "Mistral 7B Instruct", + "id": "x-ai/grok-4.1-fast", + "name": "Grok 4.1 Fast", + "display_name": "Grok 4.1 Fast", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 2000000, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.0544, - "output": 0.0544 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/Devstral-Small-2505", - "name": "Mistral Devstral Small 2505", - "display_name": "Mistral Devstral Small 2505", + "id": "Salesforce/Llama-xLAM-2-70b-fc-r", + "name": "Llama-xLAM-2 70B fc-r", + "display_name": "Llama-xLAM-2 70B fc-r", "modalities": { "input": [ "text" @@ -18694,8 +18053,8 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -18703,18 +18062,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-02", - "last_updated": "2025-08-02", + "release_date": "2025-04-13", + "last_updated": "2025-04-13", "cost": { - "input": 0.060000000000000005, - "output": 0.060000000000000005 + "input": 2.5, + "output": 2.5 }, "type": "chat" }, { - "id": "mistralai/mistral-small-creative", - "name": "Mistral Small Creative", - "display_name": "Mistral Small Creative", + "id": "nvidia/nvidia-nemotron-nano-9b-v2", + "name": "Nvidia Nemotron Nano 9B v2", + "display_name": "Nvidia Nemotron Nano 9B v2", "modalities": { "input": [ "text" @@ -18724,27 +18083,27 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "mistralai/mistral-large", - "name": "Mistral Large 2411", - "display_name": "Mistral Large 2411", + "id": "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5", + "name": "Nvidia Nemotron Super 49B v1.5", + "display_name": "Nvidia Nemotron Super 49B v1.5", "modalities": { "input": [ "text" @@ -18755,7 +18114,7 @@ }, "limit": { "context": 128000, - "output": 256000 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -18763,18 +18122,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-02-26", - "last_updated": "2024-02-26", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 2.006, - "output": 6.001 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "mistralai/ministral-14b-2512", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "nvidia/Llama-3.3-Nemotron-Super-49B-v1", + "name": "Nvidia Nemotron Super 49B", + "display_name": "Nvidia Nemotron Super 49B", "modalities": { "input": [ "text" @@ -18784,8 +18143,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -18793,18 +18152,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "shisa-ai/shisa-v2.1-llama3.3-70b", - "name": "Shisa V2.1 Llama 3.3 70B", - "display_name": "Shisa V2.1 Llama 3.3 70B", + "id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", + "name": "Nvidia Nemotron 70b", + "display_name": "Nvidia Nemotron 70b", "modalities": { "input": [ "text" @@ -18814,8 +18173,8 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -18823,18 +18182,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.357, + "output": 0.408 }, "type": "chat" }, { - "id": "shisa-ai/shisa-v2-llama3.3-70b", - "name": "Shisa V2 Llama 3.3 70B", - "display_name": "Shisa V2 Llama 3.3 70B", + "id": "nvidia/Llama-3.1-Nemotron-Ultra-253B-v1", + "name": "Nvidia Nemotron Ultra 253B", + "display_name": "Nvidia Nemotron Ultra 253B", "modalities": { "input": [ "text" @@ -18853,18 +18212,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.4, + "output": 0.8 }, "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama 3.3 70b Instruct", - "display_name": "Llama 3.3 70b Instruct", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "Nvidia Nemotron 3 Nano 30B", + "display_name": "Nvidia Nemotron 3 Nano 30B", "modalities": { "input": [ "text" @@ -18874,122 +18233,269 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 262144 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2025-12-15", + "last_updated": "2025-12-15", "cost": { - "input": 0.05, - "output": 0.23 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout", - "name": "Llama 4 Scout", - "display_name": "Llama 4 Scout", + "id": "anthropic/claude-sonnet-4.6:thinking", + "name": "Claude Sonnet 4.6 Thinking", + "display_name": "Claude Sonnet 4.6 Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 328000, - "output": 65536 + "context": 1000000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.085, - "output": 0.46 + "input": 2.992, + "output": 14.993999999999998 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick", - "name": "Llama 4 Maverick", - "display_name": "Llama 4 Maverick", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.18000000000000002, - "output": 0.8 + "input": 2.992, + "output": 14.993999999999998 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-90b-vision-instruct", - "name": "Llama 3.2 Medium", - "display_name": "Llama 3.2 Medium", + "id": "anthropic/claude-opus-4.6:thinking:low", + "name": "Claude 4.6 Opus Thinking Low", + "display_name": "Claude 4.6 Opus Thinking Low", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 4.998, + "output": 25.007 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4.6", + "name": "Claude 4.6 Opus", + "display_name": "Claude 4.6 Opus", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.9009999999999999, - "output": 0.9009999999999999 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Llama 3.2 3b Instruct", - "display_name": "Llama 3.2 3b Instruct", + "id": "anthropic/claude-opus-4.6:thinking:medium", + "name": "Claude 4.6 Opus Thinking Medium", + "display_name": "Claude 4.6 Opus Thinking Medium", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -18997,50 +18503,165 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.0306, - "output": 0.0493 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Llama 3.1 8b Instruct", - "display_name": "Llama 3.1 8b Instruct", + "id": "anthropic/claude-opus-4.6:thinking:max", + "name": "Claude 4.6 Opus Thinking Max", + "display_name": "Claude 4.6 Opus Thinking Max", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 4.998, + "output": 25.007 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4.6:thinking", + "name": "Claude 4.6 Opus Thinking", + "display_name": "Claude 4.6 Opus Thinking", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.0544, - "output": 0.0544 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, @@ -19075,9 +18696,9 @@ "type": "chat" }, { - "id": "baseten/Kimi-K2-Instruct-FP4", - "name": "Kimi K2 0711 Instruct FP4", - "display_name": "Kimi K2 0711 Instruct FP4", + "id": "shisa-ai/shisa-v2-llama3.3-70b", + "name": "Shisa V2 Llama 3.3 70B", + "display_name": "Shisa V2 Llama 3.3 70B", "modalities": { "input": [ "text" @@ -19088,7 +18709,7 @@ }, "limit": { "context": 128000, - "output": 131072 + "output": 16384 }, "tool_call": false, "reasoning": { @@ -19096,18 +18717,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.1, - "output": 2 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "Gryphe/MythoMax-L2-13b", - "name": "MythoMax 13B", - "display_name": "MythoMax 13B", + "id": "shisa-ai/shisa-v2.1-llama3.3-70b", + "name": "Shisa V2.1 Llama 3.3 70B", + "display_name": "Shisa V2.1 Llama 3.3 70B", "modalities": { "input": [ "text" @@ -19117,7 +18738,7 @@ ] }, "limit": { - "context": 4000, + "context": 32768, "output": 4096 }, "tool_call": false, @@ -19126,18 +18747,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1003, - "output": 0.1003 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "x-ai/grok-4-fast:thinking", - "name": "Grok 4 Fast Thinking", - "display_name": "Grok 4 Fast Thinking", + "id": "mistralai/ministral-14b-instruct-2512", + "name": "Ministral 3 14B", + "display_name": "Ministral 3 14B", "modalities": { "input": [ "text", @@ -19148,28 +18769,27 @@ ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 262144, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "x-ai/grok-4-07-09", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675B", + "display_name": "Mistral Large 3 675B", "modalities": { "input": [ "text", @@ -19180,60 +18800,57 @@ ] }, "limit": { - "context": 256000, - "output": 131072 + "context": 262144, + "output": 256000 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 3, - "output": 15 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "mistralai/Devstral-Small-2505", + "name": "Mistral Devstral Small 2505", + "display_name": "Mistral Devstral Small 2505", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 32768, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-20", - "last_updated": "2025-09-20", + "release_date": "2025-08-02", + "last_updated": "2025-08-02", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.060000000000000005, + "output": 0.060000000000000005 }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "mistralai/mistral-saba", + "name": "Mistral Saba", + "display_name": "Mistral Saba", "modalities": { "input": [ "text" @@ -19243,97 +18860,87 @@ ] }, "limit": { - "context": 256000, - "output": 131072 + "context": 32000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.1989, + "output": 0.595 }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "mistralai/mistral-small-creative", + "name": "Mistral Small Creative", + "display_name": "Mistral Small Creative", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 32768, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-reasoning", - "name": "Grok 4.1 Fast Reasoning", - "display_name": "Grok 4.1 Fast Reasoning", + "id": "mistralai/codestral-2508", + "name": "Codestral 2508", + "display_name": "Codestral 2508", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.3, + "output": 0.8999999999999999 }, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "Hunyuan MT 7B", - "display_name": "Hunyuan MT 7B", + "id": "mistralai/mixtral-8x22b-instruct-v0.1", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ "text" @@ -19343,8 +18950,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 65536, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19352,53 +18959,51 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 10, - "output": 20 + "input": 0.8999999999999999, + "output": 0.8999999999999999 }, "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "WizardLM-2 8x22B", - "display_name": "WizardLM-2 8x22B", + "id": "mistralai/ministral-14b-2512", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 262144, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "microsoft/MAI-DS-R1-FP8", - "name": "Microsoft DeepSeek R1", - "display_name": "Microsoft DeepSeek R1", + "id": "mistralai/mistral-large", + "name": "Mistral Large 2411", + "display_name": "Mistral Large 2411", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" @@ -19406,26 +19011,26 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 256000 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2024-02-26", + "last_updated": "2024-02-26", "cost": { - "input": 0.3, - "output": 0.3 + "input": 2.006, + "output": 6.001 }, "type": "chat" }, { - "id": "cohere/command-r", - "name": "Cohere: Command R", - "display_name": "Cohere: Command R", + "id": "mistralai/ministral-3b-2512", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -19435,8 +19040,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19444,18 +19049,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-03-11", - "last_updated": "2024-03-11", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 0.476, - "output": 1.428 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Cohere: Command R+", - "display_name": "Cohere: Command R+", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -19465,87 +19070,89 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2.856, - "output": 14.246 + "input": 0.1003, + "output": 0.1207 }, "type": "chat" }, { - "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24b Instruct", - "display_name": "Mistral Small 3.2 24b Instruct", + "id": "mistralai/mistral-medium-3", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.2, - "output": 0.4 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "nvidia/Llama-3.1-Nemotron-Ultra-253B-v1", - "name": "Nvidia Nemotron Ultra 253B", - "display_name": "Nvidia Nemotron Ultra 253B", + "id": "mistralai/mistral-7b-instruct", + "name": "Mistral 7B Instruct", + "display_name": "Mistral 7B Instruct", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 0.4, - "output": 0.8 + "input": 0.0544, + "output": 0.0544 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "Nvidia Nemotron 3 Nano 30B", - "display_name": "Nvidia Nemotron 3 Nano 30B", + "id": "mistralai/mixtral-8x7b-instruct-v0.1", + "name": "Mixtral 8x7B", + "display_name": "Mixtral 8x7B", "modalities": { "input": [ "text" @@ -19555,8 +19162,8 @@ ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19564,18 +19171,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "nvidia/nvidia-nemotron-nano-9b-v2", - "name": "Nvidia Nemotron Nano 9B v2", - "display_name": "Nvidia Nemotron Nano 9B v2", + "id": "mistralai/ministral-8b-2512", + "name": "Ministral 8B", + "display_name": "Ministral 8B", "modalities": { "input": [ "text" @@ -19585,8 +19192,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19594,18 +19201,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", - "name": "Nvidia Nemotron 70b", - "display_name": "Nvidia Nemotron 70b", + "id": "mistralai/devstral-2-123b-instruct-2512", + "name": "Devstral 2 123B", + "display_name": "Devstral 2 123B", "modalities": { "input": [ "text" @@ -19615,8 +19222,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -19624,18 +19231,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.357, - "output": 0.408 + "input": 0.4, + "output": 1.4 }, "type": "chat" }, { - "id": "nvidia/Llama-3.3-Nemotron-Super-49B-v1", - "name": "Nvidia Nemotron Super 49B", - "display_name": "Nvidia Nemotron Super 49B", + "id": "mistralai/mistral-tiny", + "name": "Mistral Tiny", + "display_name": "Mistral Tiny", "modalities": { "input": [ "text" @@ -19645,8 +19252,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -19654,18 +19261,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2023-12-11", + "last_updated": "2024-01-01", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.25499999999999995, + "output": 0.25499999999999995 }, "type": "chat" }, { - "id": "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5", - "name": "Nvidia Nemotron Super 49B v1.5", - "display_name": "Nvidia Nemotron Super 49B v1.5", + "id": "mistralai/mistral-medium-3.1", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ "text" @@ -19675,8 +19282,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -19684,109 +19291,148 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1:thinking", - "name": "DeepSeek V3.1 Thinking", - "display_name": "DeepSeek V3.1 Thinking", + "id": "qwen/Qwen3.6-35B-A3B:thinking", + "name": "Qwen3.6 35B A3B Thinking", + "display_name": "Qwen3.6 35B A3B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 262144, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": true, + "release_date": "2026-04-19", + "last_updated": "2026-04-21", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0.29, + "output": 1.74 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text", - "pdf" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 258048, "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus:thinking", - "name": "DeepSeek V3.1 Terminus (Thinking)", - "display_name": "DeepSeek V3.1 Terminus (Thinking)", + "id": "qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 262144, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-21", "cost": { - "input": 0.25, - "output": 0.7 + "input": 0.29, + "output": 1.74 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-exp-thinking", - "name": "DeepSeek V3.2 Exp Thinking", - "display_name": "DeepSeek V3.2 Exp Thinking", + "id": "tencent/Hunyuan-MT-7B", + "name": "Hunyuan MT 7B", + "display_name": "Hunyuan MT 7B", "modalities": { "input": [ "text" @@ -19796,28 +19442,27 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 10, + "output": 20 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "google/gemini-flash-1.5", + "name": "Gemini 1.5 Flash", + "display_name": "Gemini 1.5 Flash", "modalities": { "input": [ "text" @@ -19827,8 +19472,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 2000000, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -19836,29 +19481,30 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "release_date": "2024-05-14", + "last_updated": "2024-05-14", + "cost": { + "input": 0.0748, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "google/gemini-3-flash-preview-thinking", + "name": "Gemini 3 Flash Thinking", + "display_name": "Gemini 3 Flash Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 163840 + "context": 1048756, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -19868,147 +19514,122 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 0.4, - "output": 1.7 - }, - "type": "chat" - }, - { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 65536 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-02", - "last_updated": "2025-08-02", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.25, - "output": 0.7 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT 5.1 Codex Max", - "display_name": "GPT 5.1 Codex Max", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash (Preview)", + "display_name": "Gemini 3 Flash (Preview)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048756, + "output": 65536 }, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 2.5, - "output": 20 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "GPT 5.2 Chat", - "display_name": "GPT 5.2 Chat", + "id": "microsoft/wizardlm-2-8x22b", + "name": "WizardLM-2 8x22B", + "display_name": "WizardLM-2 8x22B", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 16384 + "context": 65536, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 1.75, - "output": 14 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "GPT-4o mini Search Preview", - "display_name": "GPT-4o mini Search Preview", + "id": "microsoft/MAI-DS-R1-FP8", + "name": "Microsoft DeepSeek R1", + "display_name": "Microsoft DeepSeek R1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" @@ -20016,220 +19637,151 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.088, - "output": 0.35 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/chatgpt-4o-latest", - "name": "ChatGPT 4o", - "display_name": "ChatGPT 4o", + "id": "pamanseau/OpenReasoning-Nemotron-32B", + "name": "OpenReasoning Nemotron 32B", + "display_name": "OpenReasoning Nemotron 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 4.998, - "output": 14.993999999999998 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT 5.2 Pro", - "display_name": "GPT 5.2 Pro", + "id": "Infermatic/MN-12B-Inferor-v0.0", + "name": "Mistral Nemo Inferor 12B", + "display_name": "Mistral Nemo Inferor 12B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 21, - "output": 168 + "input": 0.25499999999999995, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT 5 Mini", - "display_name": "GPT 5 Mini", + "id": "NeverSleep/Lumimaid-v0.2-70B", + "name": "Lumimaid v0.2", + "display_name": "Lumimaid v0.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.25, - "output": 2 + "input": 1, + "output": 1.5 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT 5 Nano", - "display_name": "GPT 5 Nano", + "id": "NeverSleep/Llama-3-Lumimaid-70B-v0.1", + "name": "Lumimaid 70b", + "display_name": "Lumimaid 70b", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.05, - "output": 0.4 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "nex-agi/deepseek-v3.1-nex-n1", + "name": "DeepSeek V3.1 Nex N1", + "display_name": "DeepSeek V3.1 Nex N1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -20237,30 +19789,29 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "release_date": "2025-12-10", + "last_updated": "2025-12-10", "cost": { - "input": 10, - "output": 30 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT 5.2", - "display_name": "GPT 5.2", + "id": "anthracite-org/magnum-v4-72b", + "name": "Magnum v4 72B", + "display_name": "Magnum v4 72B", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -20268,50 +19819,27 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.75, - "output": 14 + "input": 2.006, + "output": 2.992 }, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "OpenAI o3-mini (High)", - "display_name": "OpenAI o3-mini (High)", + "id": "anthracite-org/magnum-v2-72b", + "name": "Magnum V2 72B", + "display_name": "Magnum V2 72B", "modalities": { "input": [ "text" @@ -20321,302 +19849,218 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.64, - "output": 2.588 + "input": 2.006, + "output": 2.992 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "deepseek/deepseek-prover-v2-671b", + "name": "DeepSeek Prover v2 671B", + "display_name": "DeepSeek Prover v2 671B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 160000, "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-04-30", + "last_updated": "2025-04-30", "cost": { - "input": 0.1496, - "output": 0.595 + "input": 1, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "OpenAI o4-mini Deep Research", - "display_name": "OpenAI o4-mini Deep Research", + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek V3.2 Speciale", + "display_name": "DeepSeek V3.2 Speciale", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163000, + "output": 65536 }, "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "GPT 5.1 Chat", - "display_name": "GPT 5.1 Chat", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.25, - "output": 10 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI o4-mini", - "display_name": "OpenAI o4-mini", + "id": "deepseek/deepseek-v3.2:thinking", + "name": "DeepSeek V3.2 Thinking", + "display_name": "DeepSeek V3.2 Thinking", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163000, + "output": 65536 }, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT 5.2 Codex", - "display_name": "GPT 5.2 Codex", + "id": "huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated", + "name": "DeepSeek R1 Llama 70B Abliterated", + "display_name": "DeepSeek R1 Llama 70B Abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 1.75, - "output": 14 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT 5.1 Codex Mini", - "display_name": "GPT 5.1 Codex Mini", + "id": "huihui-ai/Llama-3.1-Nemotron-70B-Instruct-HF-abliterated", + "name": "Nemotron 3.1 70B abliterated", + "display_name": "Nemotron 3.1 70B abliterated", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.25, - "output": 2 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/o1-preview", - "name": "OpenAI o1-preview", - "display_name": "OpenAI o1-preview", + "id": "huihui-ai/Qwen2.5-32B-Instruct-abliterated", + "name": "Qwen 2.5 32B Abliterated", + "display_name": "Qwen 2.5 32B Abliterated", "modalities": { "input": [ "text" @@ -20626,127 +20070,88 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "release_date": "2025-01-06", + "last_updated": "2025-01-06", "cost": { - "input": 14.993999999999998, - "output": 59.993 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated", + "name": "DeepSeek R1 Qwen Abliterated", + "display_name": "DeepSeek R1 Qwen Abliterated", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 2.499, - "output": 9.996 + "input": 1.4, + "output": 1.4 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT 5.1", - "display_name": "GPT 5.1", + "id": "huihui-ai/Llama-3.3-70B-Instruct-abliterated", + "name": "Llama 3.3 70B Instruct abliterated", + "display_name": "Llama 3.3 70B Instruct abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1.25, - "output": 10 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "OpenAI o1", + "id": "ReadyArt/MS3.2-The-Omega-Directive-24B-Unslop-v2.0", + "name": "Omega Directive 24B Unslop v2.0", + "display_name": "Omega Directive 24B Unslop v2.0", "modalities": { "input": [ "text" @@ -20756,42 +20161,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-17", - "last_updated": "2024-12-17", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 14.993999999999998, - "output": 59.993 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5 Turbo", - "display_name": "GPT-3.5 Turbo", + "id": "ReadyArt/The-Omega-Abomination-L-70B-v1.0", + "name": "The Omega Abomination V1", + "display_name": "The Omega Abomination V1", "modalities": { "input": [ "text" @@ -20801,8 +20191,8 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -20810,18 +20200,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2022-11-30", - "last_updated": "2024-01-01", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.7, + "output": 0.95 }, "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "OpenAI o3 Deep Research", - "display_name": "OpenAI o3 Deep Research", + "id": "featherless-ai/Qwerky-72B", + "name": "Qwerky 72B", + "display_name": "Qwerky 72B", "modalities": { "input": [ "text" @@ -20831,42 +20221,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32000, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "OpenAI o3-mini", + "id": "meituan-longcat/LongCat-Flash-Chat-FP8", + "name": "LongCat Flash", + "display_name": "LongCat Flash", "modalities": { "input": [ "text" @@ -20876,42 +20251,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-08-31", + "last_updated": "2025-08-31", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.15, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo-preview", - "name": "GPT-4 Turbo Preview", - "display_name": "GPT-4 Turbo Preview", + "id": "failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5", + "name": "Llama 3 70B abliterated", + "display_name": "Llama 3 70B abliterated", "modalities": { "input": [ "text" @@ -20921,8 +20281,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -20930,65 +20290,49 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 9.996, - "output": 30.004999999999995 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "openai/o1-pro", - "name": "OpenAI o1 Pro", - "display_name": "OpenAI o1 Pro", + "id": "meta-llama/llama-4-scout", + "name": "Llama 4 Scout", + "display_name": "Llama 4 Scout", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 328000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 150, - "output": 600 + "input": 0.085, + "output": 0.46 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "meta-llama/llama-3.2-90b-vision-instruct", + "name": "Llama 3.2 Medium", + "display_name": "Llama 3.2 Medium", "modalities": { "input": [ "text" @@ -20998,49 +20342,27 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.9009999999999999, + "output": 0.9009999999999999 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat-latest", - "name": "GPT 5.1 Chat (Latest)", - "display_name": "GPT 5.1 Chat (Latest)", + "id": "meta-llama/llama-4-maverick", + "name": "Llama 4 Maverick", + "display_name": "Llama 4 Maverick", "modalities": { "input": [ "text", @@ -21051,63 +20373,60 @@ ] }, "limit": { - "context": 400000, - "output": 16384 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 1.25, - "output": 10 + "input": 0.18000000000000002, + "output": 0.8 }, "type": "chat" }, { - "id": "openai/gpt-4o-search-preview", - "name": "GPT-4o Search Preview", - "display_name": "GPT-4o Search Preview", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "display_name": "Llama 3.3 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 1.47, - "output": 5.88 + "input": 0.05, + "output": 0.23 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT 4.1 Nano", - "display_name": "GPT 4.1 Nano", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Llama 3.2 3b Instruct", + "display_name": "Llama 3.2 3b Instruct", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -21115,8 +20434,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -21124,18 +20443,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.0306, + "output": 0.0493 }, "type": "chat" }, { - "id": "openai/o4-mini-high", - "name": "OpenAI o4-mini high", - "display_name": "OpenAI o4-mini high", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8b Instruct", + "display_name": "Llama 3.1 8b Instruct", "modalities": { "input": [ "text" @@ -21145,42 +20464,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.0544, + "output": 0.0544 }, "type": "chat" }, { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "VongolaChouko/Starcannon-Unleashed-12B-v1.0", + "name": "Mistral Nemo Starcannon 12b v1", + "display_name": "Mistral Nemo Starcannon 12b v1", "modalities": { "input": [ "text" @@ -21190,42 +20494,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 2, - "output": 8 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "arcee-ai/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ "text" @@ -21235,80 +20524,57 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.04, + "input": 0.045000000000000005, "output": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT 5 Pro", - "display_name": "GPT 5 Pro", + "id": "arcee-ai/trinity-large", + "name": "Trinity Large", + "display_name": "Trinity Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 15, - "output": 120 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "openai/gpt-5.1-2025-11-13", - "name": "GPT-5.1 (2025-11-13)", - "display_name": "GPT-5.1 (2025-11-13)", + "id": "meganova-ai/manta-flash-1.0", + "name": "Manta Flash 1.0", + "display_name": "Manta Flash 1.0", "modalities": { "input": [ "text" @@ -21318,80 +20584,57 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-12-20", + "last_updated": "2025-12-20", "cost": { - "input": 1.25, - "output": 10 + "input": 0.02, + "output": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "meganova-ai/manta-pro-1.0", + "name": "Manta Pro 1.0", + "display_name": "Manta Pro 1.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-12-20", + "last_updated": "2025-12-20", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0.060000000000000005, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/o3-mini-low", - "name": "OpenAI o3-mini (Low)", - "display_name": "OpenAI o3-mini (Low)", + "id": "meganova-ai/manta-mini-1.0", + "name": "Manta Mini 1.0", + "display_name": "Manta Mini 1.0", "modalities": { "input": [ "text" @@ -21401,96 +20644,57 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-12-20", + "last_updated": "2025-12-20", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.02, + "output": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT 5", - "display_name": "GPT 5", + "id": "LatitudeGames/Wayfarer-Large-70B-Llama-3.3", + "name": "Llama 3.3 70B Wayfarer", + "display_name": "Llama 3.3 70B Wayfarer", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 1.25, - "output": 10 + "input": 0.700000007, + "output": 0.700000007 }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "display_name": "GPT OSS Safeguard 20B", + "id": "essentialai/rnj-1-instruct", + "name": "RNJ-1 Instruct 8B", + "display_name": "RNJ-1 Instruct 8B", "modalities": { "input": [ "text" @@ -21501,27 +20705,26 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "release_date": "2025-12-13", + "last_updated": "2025-12-13", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/o3-pro-2025-06-10", - "name": "OpenAI o3-pro (2025-06-10)", - "display_name": "OpenAI o3-pro (2025-06-10)", + "id": "abacusai/Dracarys-72B-Instruct", + "name": "Llama 3.1 70B Dracarys 2", + "display_name": "Llama 3.1 70B Dracarys 2", "modalities": { "input": [ "text" @@ -21531,142 +20734,130 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "release_date": "2025-08-02", + "last_updated": "2025-08-02", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "alibaba/qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 991800, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.19, + "output": 1.16 }, "type": "chat" }, { - "id": "openai/gpt-5-chat-latest", - "name": "GPT 5 Chat", - "display_name": "GPT 5 Chat", + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMax M1 80K", + "display_name": "MiniMax M1 80K", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 1.25, - "output": 10 + "input": 0.6052, + "output": 2.4225000000000003 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT 4.1", - "display_name": "GPT 4.1", + "id": "allenai/olmo-3.1-32b-instruct", + "name": "Olmo 3.1 32B Instruct", + "display_name": "Olmo 3.1 32B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 65536, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "release_date": "2026-01-25", + "last_updated": "2026-01-25", "cost": { - "input": 2, - "output": 8 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT 4.1 Mini", - "display_name": "GPT 4.1 Mini", + "id": "allenai/molmo-2-8b", + "name": "Molmo 2 8B", + "display_name": "Molmo 2 8B", "modalities": { "input": [ "text", @@ -21677,8 +20868,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 36864, + "output": 36864 }, "tool_call": false, "reasoning": { @@ -21686,75 +20877,52 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT 5.1 Codex", - "display_name": "GPT 5.1 Codex", + "id": "allenai/olmo-3.1-32b-think", + "name": "Olmo 3.1 32B Think", + "display_name": "Olmo 3.1 32B Think", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-01-25", + "last_updated": "2026-01-25", "cost": { - "input": 1.25, - "output": 10 + "input": 0.15, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "allenai/olmo-3-32b-think", + "name": "Olmo 3 32B Think", + "display_name": "Olmo 3 32B Think", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -21762,26 +20930,27 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0.3, + "output": 0.44999999999999996 }, "type": "chat" }, { - "id": "VongolaChouko/Starcannon-Unleashed-12B-v1.0", - "name": "Mistral Nemo Starcannon 12b v1", - "display_name": "Mistral Nemo Starcannon 12b v1", + "id": "cognitivecomputations/dolphin-2.9.2-qwen2-72b", + "name": "Dolphin 72b", + "display_name": "Dolphin 72b", "modalities": { "input": [ "text" @@ -21791,8 +20960,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 8192, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -21800,18 +20969,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "amazon/nova-lite-v1", - "name": "Amazon Nova Lite 1.0", - "display_name": "Amazon Nova Lite 1.0", + "id": "Steelskull/L3.3-Electra-R1-70b", + "name": "Steelskull Electra R1 70b", + "display_name": "Steelskull Electra R1 70b", "modalities": { "input": [ "text" @@ -21821,8 +20990,8 @@ ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -21830,18 +20999,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.0595, - "output": 0.238 + "input": 0.69989, + "output": 0.69989 }, "type": "chat" }, { - "id": "amazon/nova-pro-v1", - "name": "Amazon Nova Pro 1.0", - "display_name": "Amazon Nova Pro 1.0", + "id": "Steelskull/L3.3-MS-Nevoria-70b", + "name": "Steelskull Nevoria 70b", + "display_name": "Steelskull Nevoria 70b", "modalities": { "input": [ "text" @@ -21851,8 +21020,8 @@ ] }, "limit": { - "context": 300000, - "output": 32000 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -21860,18 +21029,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.7989999999999999, - "output": 3.1959999999999997 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "amazon/nova-2-lite-v1", - "name": "Amazon Nova 2 Lite", - "display_name": "Amazon Nova 2 Lite", + "id": "Steelskull/L3.3-Nevoria-R1-70b", + "name": "Steelskull Nevoria R1 70b", + "display_name": "Steelskull Nevoria R1 70b", "modalities": { "input": [ "text" @@ -21881,8 +21050,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65535 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -21890,18 +21059,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.5099999999999999, - "output": 4.25 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "amazon/nova-micro-v1", - "name": "Amazon Nova Micro 1.0", - "display_name": "Amazon Nova Micro 1.0", + "id": "Steelskull/L3.3-MS-Evayale-70B", + "name": "Evayale 70b ", + "display_name": "Evayale 70b ", "modalities": { "input": [ "text" @@ -21911,8 +21080,8 @@ ] }, "limit": { - "context": 128000, - "output": 5120 + "context": 16384, + "output": 16384 }, "tool_call": false, "reasoning": { @@ -21920,18 +21089,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.0357, - "output": 0.1394 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "Sao10K/L3.3-70B-Euryale-v2.3", - "name": "Llama 3.3 70B Euryale", - "display_name": "Llama 3.3 70B Euryale", + "id": "Steelskull/L3.3-MS-Evalebis-70b", + "name": "MS Evalebis 70b", + "display_name": "MS Evalebis 70b", "modalities": { "input": [ "text" @@ -21941,7 +21110,7 @@ ] }, "limit": { - "context": 20480, + "context": 16384, "output": 16384 }, "tool_call": false, @@ -21959,9 +21128,9 @@ "type": "chat" }, { - "id": "Sao10K/L3.1-70B-Euryale-v2.2", - "name": "Llama 3.1 70B Euryale", - "display_name": "Llama 3.1 70B Euryale", + "id": "Steelskull/L3.3-Cu-Mai-R1-70b", + "name": "Llama 3.3 70B Cu Mai", + "display_name": "Llama 3.3 70B Cu Mai", "modalities": { "input": [ "text" @@ -21971,7 +21140,7 @@ ] }, "limit": { - "context": 20480, + "context": 16384, "output": 16384 }, "tool_call": false, @@ -21980,18 +21149,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.306, - "output": 0.357 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "Sao10K/L3.1-70B-Hanami-x1", - "name": "Llama 3.1 70B Hanami", - "display_name": "Llama 3.1 70B Hanami", + "id": "dmind/dmind-1", + "name": "DMind-1", + "display_name": "DMind-1", "modalities": { "input": [ "text" @@ -22001,8 +21170,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -22010,18 +21179,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.3, + "output": 0.6 }, "type": "chat" }, { - "id": "Sao10K/L3-8B-Stheno-v3.2", - "name": "Sao10K Stheno 8b", - "display_name": "Sao10K Stheno 8b", + "id": "dmind/dmind-1-mini", + "name": "DMind-1-Mini", + "display_name": "DMind-1-Mini", "modalities": { "input": [ "text" @@ -22031,7 +21200,7 @@ ] }, "limit": { - "context": 16384, + "context": 32768, "output": 8192 }, "tool_call": false, @@ -22040,18 +21209,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-11-29", - "last_updated": "2024-11-29", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.2, + "output": 0.4 }, "type": "chat" }, { - "id": "LatitudeGames/Wayfarer-Large-70B-Llama-3.3", - "name": "Llama 3.3 70B Wayfarer", - "display_name": "Llama 3.3 70B Wayfarer", + "id": "xiaomi/mimo-v2-flash-thinking-original", + "name": "MiMo V2 Flash (Thinking) Original", + "display_name": "MiMo V2 Flash (Thinking) Original", "modalities": { "input": [ "text" @@ -22061,8 +21230,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -22070,18 +21239,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.700000007, - "output": 0.700000007 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "z-ai/glm-4.6:thinking", - "name": "GLM 4.6 Thinking", - "display_name": "GLM 4.6 Thinking", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ "text" @@ -22091,60 +21260,57 @@ ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 256000, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.4, - "output": 1.5 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "z-ai/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "xiaomi/mimo-v2-flash-thinking", + "name": "MiMo V2 Flash (Thinking)", + "display_name": "MiMo V2 Flash (Thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 96000 + "context": 256000, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-22", - "last_updated": "2025-11-22", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.6, - "output": 1.7999999999999998 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "xiaomi/mimo-v2-flash-original", + "name": "MiMo V2 Flash Original", + "display_name": "MiMo V2 Flash Original", "modalities": { "input": [ "text" @@ -22154,58 +21320,50 @@ ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 256000, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.4, - "output": 1.5 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "z-ai/glm-4.5v:thinking", - "name": "GLM 4.5V Thinking", - "display_name": "GLM 4.5V Thinking", + "id": "baidu/ernie-4.5-300b-a47b", + "name": "ERNIE 4.5 300B", + "display_name": "ERNIE 4.5 300B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 96000 + "context": 131072, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-22", - "last_updated": "2025-11-22", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.6, - "output": 1.7999999999999998 + "input": 0.35, + "output": 1.15 }, "type": "chat" }, @@ -22241,9 +21399,9 @@ "type": "chat" }, { - "id": "baidu/ernie-4.5-300b-a47b", - "name": "ERNIE 4.5 300B", - "display_name": "ERNIE 4.5 300B", + "id": "stepfun-ai/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -22253,27 +21411,28 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 256000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 0.35, - "output": 1.15 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "dmind/dmind-1", - "name": "DMind-1", - "display_name": "DMind-1", + "id": "stepfun-ai/step-3.5-flash:thinking", + "name": "Step 3.5 Flash Thinking", + "display_name": "Step 3.5 Flash Thinking", "modalities": { "input": [ "text" @@ -22283,27 +21442,28 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 256000, + "output": 256000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 0.3, - "output": 0.6 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "dmind/dmind-1-mini", - "name": "DMind-1-Mini", - "display_name": "DMind-1-Mini", + "id": "miromind-ai/mirothinker-v1.5-235b", + "name": "MiroThinker v1.5 235B", + "display_name": "MiroThinker v1.5 235B", "modalities": { "input": [ "text" @@ -22314,7 +21474,7 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 4000 }, "tool_call": false, "reasoning": { @@ -22322,18 +21482,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2026-01-07", + "last_updated": "2026-01-07", "cost": { - "input": 0.2, - "output": 0.4 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "Infermatic/MN-12B-Inferor-v0.0", - "name": "Mistral Nemo Inferor 12B", - "display_name": "Mistral Nemo Inferor 12B", + "id": "tngtech/tng-r1t-chimera", + "name": "TNG R1T Chimera", + "display_name": "TNG R1T Chimera", "modalities": { "input": [ "text" @@ -22343,8 +21503,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 65536 }, "tool_call": false, "reasoning": { @@ -22352,18 +21512,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 0.25499999999999995, - "output": 0.49299999999999994 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "meituan-longcat/LongCat-Flash-Chat-FP8", - "name": "LongCat Flash", - "display_name": "LongCat Flash", + "id": "tngtech/DeepSeek-TNG-R1T2-Chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "display_name": "DeepSeek TNG R1T2 Chimera", "modalities": { "input": [ "text" @@ -22374,26 +21534,35 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-31", - "last_updated": "2025-08-31", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.15, - "output": 0.7 + "input": 0.31, + "output": 0.31 }, "type": "chat" - }, + } + ] + }, + "io-net": { + "id": "io-net", + "name": "IO.NET", + "display_name": "IO.NET", + "api": "https://api.intelligence.io.solutions/api/v1", + "doc": "https://io.net/docs/guides/intelligence/io-intelligence", + "models": [ { - "id": "meganova-ai/manta-mini-1.0", - "name": "Manta Mini 1.0", - "display_name": "Manta Mini 1.0", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -22403,27 +21572,43 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-28", "cost": { - "input": 0.02, - "output": 0.16 + "input": 2, + "output": 8.75, + "cache_read": 1, + "cache_write": 4 }, "type": "chat" }, { - "id": "meganova-ai/manta-pro-1.0", - "name": "Manta Pro 1.0", - "display_name": "Manta Pro 1.0", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -22434,26 +21619,42 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.060000000000000005, - "output": 0.5 + "input": 0.55, + "output": 2.25, + "cache_read": 0.275, + "cache_write": 1.1 }, "type": "chat" }, { - "id": "meganova-ai/manta-flash-1.0", - "name": "Manta Flash 1.0", - "display_name": "Manta Flash 1.0", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -22463,27 +21664,31 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 32768, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "knowledge": "2024-08", + "release_date": "2024-09-05", + "last_updated": "2024-09-05", "cost": { - "input": 0.02, - "output": 0.16 + "input": 0.39, + "output": 1.9, + "cache_read": 0.195, + "cache_write": 0.78 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "openai/gpt-oss-20b", + "name": "GPT-OSS 20B", + "display_name": "GPT-OSS 20B", "modalities": { "input": [ "text" @@ -22493,70 +21698,75 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 64000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.03, + "output": 0.14, + "cache_read": 0.015, + "cache_write": 0.06 }, "type": "chat" }, { - "id": "minimax/minimax-01", - "name": "MiniMax 01", - "display_name": "MiniMax 01", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000192, - "output": 16384 + "context": 131072, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.1394, - "output": 1.1219999999999999 + "input": 0.04, + "output": 0.4, + "cache_read": 0.02, + "cache_write": 0.08 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -22567,12 +21777,12 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -22581,18 +21791,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "knowledge": "2024-10", + "release_date": "2024-11-15", + "last_updated": "2024-11-15", "cost": { - "input": 0.33, - "output": 1.32 + "input": 0.4, + "output": 1.75, + "cache_read": 0.2, + "cache_write": 0.8 }, "type": "chat" }, { - "id": "minimax/minimax-m2-her", - "name": "MiniMax M2-her", - "display_name": "MiniMax M2-her", + "id": "Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ "text" @@ -22602,27 +21815,31 @@ ] }, "limit": { - "context": 65532, - "output": 2048 + "context": 106000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-24", - "last_updated": "2026-01-24", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0.30200000000000005, - "output": 1.2069999999999999 + "input": 0.22, + "output": 0.95, + "cache_read": 0.11, + "cache_write": 0.44 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "mistralai/Devstral-Small-2505", + "name": "Devstral Small 2505", + "display_name": "Devstral Small 2505", "modalities": { "input": [ "text" @@ -22632,163 +21849,100 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-12", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 }, "type": "chat" }, { - "id": "qwen/Qwen3.6-35B-A3B:thinking", - "name": "Qwen3.6 35B A3B Thinking", - "display_name": "Qwen3.6 35B A3B Thinking", + "id": "mistralai/Mistral-Large-Instruct-2411", + "name": "Mistral Large Instruct 2411", + "display_name": "Mistral Large Instruct 2411", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-19", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.29, - "output": 1.74 + "input": 2, + "output": 6, + "cache_read": 1, + "cache_write": 4 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ - "text", - "image", - "video" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 258048, - "output": 65536 - }, - "tool_call": false, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", - "cost": { - "input": 0.6, - "output": 3.6 - }, - "type": "chat" - }, - { - "id": "qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", - "modalities": { - "input": [ - "text", - "image", - "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-21", + "knowledge": "2024-05", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.29, - "output": 1.74 + "input": 0.02, + "output": 0.04, + "cache_read": 0.01, + "cache_write": 0.04 }, "type": "chat" }, { - "id": "unsloth/gemma-3-1b-it", - "name": "Gemma 3 1B IT", - "display_name": "Gemma 3 1B IT", + "id": "mistralai/Magistral-Small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ "text" @@ -22799,61 +21953,68 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "knowledge": "2025-01", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.1003, - "output": 0.1003 + "input": 0.5, + "output": 1.5, + "cache_read": 0.25, + "cache_write": 1 }, "type": "chat" }, { - "id": "unsloth/gemma-3-12b-it", - "name": "Gemma 3 12B IT", - "display_name": "Gemma 3 12B IT", + "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", + "name": "Llama 3.2 90B Vision Instruct", + "display_name": "Llama 3.2 90B Vision Instruct", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 16000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.272, - "output": 0.272 + "input": 0.35, + "output": 0.4, + "cache_read": 0.175, + "cache_write": 0.7 }, "type": "chat" }, { - "id": "unsloth/gemma-3-4b-it", - "name": "Gemma 3 4B IT", - "display_name": "Gemma 3 4B IT", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" @@ -22861,57 +22022,65 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.13, + "output": 0.38, + "cache_read": 0.065, + "cache_write": 0.26 }, "type": "chat" }, { - "id": "unsloth/gemma-3-27b-it", - "name": "Gemma 3 27B IT", - "display_name": "Gemma 3 27B IT", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 96000 + "context": 430000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0.2992, - "output": 0.2992 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "GLM Z1 9B 0414", - "display_name": "GLM Z1 9B 0414", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen 3 235B Thinking", + "display_name": "Qwen 3 235B Thinking", "modalities": { "input": [ "text" @@ -22921,27 +22090,43 @@ ] }, "limit": { - "context": 32000, - "output": 8000 + "context": 262144, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.11, + "output": 0.6, + "cache_read": 0.055, + "cache_write": 0.22 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "GLM 4 9B 0414", - "display_name": "GLM 4 9B 0414", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen 3 Next 80B Instruct", + "display_name": "Qwen 3 Next 80B Instruct", "modalities": { "input": [ "text" @@ -22951,30 +22136,35 @@ ] }, "limit": { - "context": 32000, - "output": 8000 + "context": 262144, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-10", + "last_updated": "2025-01-10", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.1, + "output": 0.8, + "cache_read": 0.05, + "cache_write": 0.2 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-Rumination-32B-0414", - "name": "GLM Z1 Rumination 32B 0414", - "display_name": "GLM Z1 Rumination 32B 0414", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen 2.5 VL 32B Instruct", + "display_name": "Qwen 2.5 VL 32B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -22982,26 +22172,39 @@ }, "limit": { "context": 32000, - "output": 65536 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 }, "type": "chat" - }, + } + ] + }, + "inception": { + "id": "inception", + "name": "Inception", + "display_name": "Inception", + "api": "https://api.inceptionlabs.ai/v1/", + "doc": "https://platform.inceptionlabs.ai/docs", + "models": [ { - "id": "THUDM/GLM-4-32B-0414", - "name": "GLM 4 32B 0414", - "display_name": "GLM 4 32B 0414", + "id": "mercury-edit-2", + "name": "Mercury Edit 2", + "display_name": "Mercury Edit 2", "modalities": { "input": [ "text" @@ -23012,26 +22215,29 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-03-30", + "last_updated": "2026-03-30", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "GLM Z1 32B 0414", - "display_name": "GLM Z1 32B 0414", + "id": "mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ "text" @@ -23042,39 +22248,52 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 50000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2025-01-01", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" - }, + } + ] + }, + "submodel": { + "id": "submodel", + "name": "submodel", + "display_name": "submodel", + "api": "https://llm.submodel.ai/v1", + "doc": "https://submodel.gitbook.io", + "models": [ { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash (Preview)", - "display_name": "Gemini 3 Flash (Preview)", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 75000, + "output": 163840 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23083,36 +22302,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { "input": 0.5, - "output": 3 + "output": 2.15 }, "type": "chat" }, { - "id": "google/gemini-flash-1.5", - "name": "Gemini 1.5 Flash", - "display_name": "Gemini 1.5 Flash", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -23122,120 +22333,97 @@ ] }, "limit": { - "context": 2000000, - "output": 8192 + "context": 75000, + "output": 163840 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.0748, - "output": 0.306 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview-thinking", - "name": "Gemini 3 Flash Thinking", - "display_name": "Gemini 3 Flash Thinking", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 75000, + "output": 163840 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.5, - "output": 3 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.3, - "output": 1.9 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "zai-org/GLM-4.5-Air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -23245,27 +22433,28 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0.1, - "output": 2 + "output": 0.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-original", - "name": "Kimi K2 Thinking Original", - "display_name": "Kimi K2 Thinking Original", + "id": "zai-org/GLM-4.5-FP8", + "name": "GLM 4.5 FP8", + "display_name": "GLM 4.5 FP8", "modalities": { "input": [ "text" @@ -23275,28 +22464,29 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct-0711", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -23306,58 +22496,71 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.1, - "output": 2 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "moonshotai/Kimi-Dev-72B", - "name": "Kimi Dev 72B", - "display_name": "Kimi Dev 72B", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 262144, "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-turbo-original", - "name": "Kimi K2 Thinking Turbo Original", - "display_name": "Kimi K2 Thinking Turbo Original", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -23367,28 +22570,37 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 1.15, - "output": 8 + "input": 0.2, + "output": 0.3 }, "type": "chat" - }, + } + ] + }, + "requesty": { + "id": "requesty", + "name": "Requesty", + "display_name": "Requesty", + "api": "https://router.requesty.ai/v1", + "doc": "https://requesty.ai/solution/llm-routing/models", + "models": [ { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", "modalities": { "input": [ "text", @@ -23399,32 +22611,52 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 100000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.53, - "output": 2.73 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6:thinking", - "name": "Kimi K2.6 Thinking", - "display_name": "Kimi K2.6 Thinking", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ "text", @@ -23435,99 +22667,106 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-21", - "cost": { - "input": 0.53, - "output": 2.73 - }, - "type": "chat" - }, - { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 262144 - }, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.4, - "output": 2 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "openai/gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2024-10-01", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5:thinking", - "name": "Kimi K2.5 Thinking", - "display_name": "Kimi K2.5 Thinking", + "id": "openai/gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ "text", @@ -23538,9 +22777,10 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23548,108 +22788,147 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.9 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Tongyi-Zhiwen/QwenLong-L1-32B", - "name": "QwenLong L1 32B", - "display_name": "QwenLong L1 32B", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 40960 - }, - "tool_call": false, + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.13999999999999999, - "output": 0.6 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "nothingiisreal/L3.1-70B-Celeste-V0.1-BF16", - "name": "Llama 3.1 70B Celeste v0.1", - "display_name": "Llama 3.1 70B Celeste v0.1", + "id": "openai/gpt-5-image", + "name": "GPT-5 Image", + "display_name": "GPT-5 Image", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-10-01", + "release_date": "2025-10-14", + "last_updated": "2025-10-14", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0", - "name": "Aion 1.0", - "display_name": "Aion 1.0", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 3.995, - "output": 7.99 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "aion-labs/aion-rp-llama-3.1-8b", - "name": "Llama 3.1 8b (uncensored)", - "display_name": "Llama 3.1 8b (uncensored)", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text" @@ -23659,131 +22938,212 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 16000, + "output": 4000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0-mini", - "name": "Aion 1.0 mini (DeepSeek)", - "display_name": "Aion 1.0 mini (DeepSeek)", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.7989999999999999, - "output": 1.394 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", - "name": "Tongyi DeepResearch 30B A3B", - "display_name": "Tongyi DeepResearch 30B A3B", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-Max", + "display_name": "GPT-5.1-Codex-Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.08, - "output": 0.24000000000000002 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMax M1 80K", - "display_name": "MiniMax M1 80K", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06-16", - "last_updated": "2025-06-16", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.6052, - "output": 2.4225000000000003 + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:low", - "name": "Claude 4.6 Opus Thinking Low", - "display_name": "Claude 4.6 Opus Thinking Low", + "id": "openai/o4-mini", + "name": "o4 Mini", + "display_name": "o4 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 100000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23793,56 +23153,46 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "medium", "effort_options": [ "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 4.998, - "output": 25.007 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude 4.6 Opus", - "display_name": "Claude 4.6 Opus", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23852,56 +23202,53 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 4.998, - "output": 25.007 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6:thinking", - "name": "Claude Sonnet 4.6 Thinking", - "display_name": "Claude Sonnet 4.6 Thinking", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -23911,57 +23258,87 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "medium", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 2.992, - "output": 14.993999999999998 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:max", - "name": "Claude 4.6 Opus Thinking Max", - "display_name": "Claude 4.6 Opus Thinking Max", + "id": "openai/gpt-5-chat", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -23971,42 +23348,39 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 4.998, - "output": 25.007 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:medium", - "name": "Claude 4.6 Opus Thinking Medium", - "display_name": "Claude 4.6 Opus Thinking Medium", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3-Codex", + "display_name": "GPT-5.3-Codex", "modalities": { "input": [ "text", @@ -24018,9 +23392,10 @@ ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -24030,42 +23405,198 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "audio", + "image", + "video" + ], + "output": [ + "text", + "audio", + "image" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-3-7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "Anthropic uses thinking budget tokens" ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-01", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 4.998, - "output": 25.007 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 62000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-01", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -24076,10 +23607,47 @@ "text" ] }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { "context": 1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -24117,15 +23685,35 @@ "release_date": "2026-02-17", "last_updated": "2026-02-17", "cost": { - "input": 2.992, - "output": 14.993999999999998 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking", - "name": "Claude 4.6 Opus Thinking", - "display_name": "Claude 4.6 Opus Thinking", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", @@ -24140,15 +23728,16 @@ "context": 1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "mixed", "budget": { "min": 1024, @@ -24173,168 +23762,295 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-05-31", "release_date": "2026-02-05", "last_updated": "2026-02-05", "cost": { - "input": 4.998, - "output": 25.007 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "abacusai/Dracarys-72B-Instruct", - "name": "Llama 3.1 70B Dracarys 2", - "display_name": "Llama 3.1 70B Dracarys 2", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-02", - "last_updated": "2025-08-02", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0", - "name": "EVA Llama 3.33 70B", - "display_name": "EVA Llama 3.33 70B", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 2.006, - "output": 2.006 + "input": 2, + "output": 12, + "cache_read": 0.2, + "cache_write": 4.5 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2", - "name": "EVA-Qwen2.5-72B-v0.2", - "display_name": "EVA-Qwen2.5-72B-v0.2", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.7989999999999999, - "output": 0.7989999999999999 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 1 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1", - "name": "EVA-LLaMA-3.33-70B-v0.1", - "display_name": "EVA-LLaMA-3.33-70B-v0.1", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 2.006, - "output": 2.006 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.55 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-Qwen2.5-32B-v0.2", - "name": "EVA-Qwen2.5-32B-v0.2", - "display_name": "EVA-Qwen2.5-32B-v0.2", + "id": "xai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 256000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "knowledge": "2025-01", + "release_date": "2025-09-09", + "last_updated": "2025-09-09", "cost": { - "input": 0.7989999999999999, - "output": 0.7989999999999999 + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 3 }, "type": "chat" }, { - "id": "huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated", - "name": "DeepSeek R1 Qwen Abliterated", - "display_name": "DeepSeek R1 Qwen Abliterated", + "id": "xai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ "text" @@ -24344,299 +24060,485 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 2000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-01", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 1.4, - "output": 1.4 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05, + "cache_write": 0.2 + }, + "type": "chat" }, { - "id": "huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated", - "name": "DeepSeek R1 Llama 70B Abliterated", - "display_name": "DeepSeek R1 Llama 70B Abliterated", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.7, - "output": 0.7 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "huihui-ai/Llama-3.3-70B-Instruct-abliterated", - "name": "Llama 3.3 70B Instruct abliterated", - "display_name": "Llama 3.3 70B Instruct abliterated", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.7, - "output": 0.7 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "huihui-ai/Qwen2.5-32B-Instruct-abliterated", - "name": "Qwen 2.5 32B Abliterated", - "display_name": "Qwen 2.5 32B Abliterated", + "id": "openai/gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 272000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-06", - "last_updated": "2025-01-06", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.7, - "output": 0.7 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "huihui-ai/Llama-3.1-Nemotron-70B-Instruct-HF-abliterated", - "name": "Nemotron 3.1 70B abliterated", - "display_name": "Nemotron 3.1 70B abliterated", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.7, - "output": 0.7 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash-thinking-original", - "name": "MiMo V2 Flash (Thinking) Original", - "display_name": "MiMo V2 Flash (Thinking) Original", + "id": "openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.102, - "output": 0.306 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash-thinking", - "name": "MiMo V2 Flash (Thinking)", - "display_name": "MiMo V2 Flash (Thinking)", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.102, - "output": 0.306 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", + "id": "anthropic/claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.102, - "output": 0.306 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash-original", - "name": "MiMo V2 Flash Original", - "display_name": "MiMo V2 Flash Original", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.102, - "output": 0.306 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "tngtech/DeepSeek-TNG-R1T2-Chimera", - "name": "DeepSeek TNG R1T2 Chimera", - "display_name": "DeepSeek TNG R1T2 Chimera", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.31, - "output": 0.31 + "input": 1.25, + "output": 10, + "cache_read": 0.31, + "cache_write": 2.375, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" - }, + } + ] + }, + "zai": { + "id": "zai", + "name": "Z.AI", + "display_name": "Z.AI", + "api": "https://api.z.ai/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "models": [ { - "id": "tngtech/tng-r1t-chimera", - "name": "TNG R1T Chimera", - "display_name": "TNG R1T Chimera", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -24646,57 +24548,90 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-11-26", - "last_updated": "2025-11-26", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "inflatebot/MN-12B-Mag-Mell-R1", - "name": "Mag Mell R1", - "display_name": "Mag Mell R1", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.2, + "output": 4, + "cache_read": 0.24, + "cache_write": 0 }, "type": "chat" }, { - "id": "failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5", - "name": "Llama 3 70B abliterated", - "display_name": "Llama 3 70B abliterated", + "id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ "text" @@ -24706,104 +24641,80 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "abacus": { - "id": "abacus", - "name": "Abacus", - "display_name": "Abacus", - "api": "https://routellm.abacus.ai/v1", - "doc": "https://abacus.ai/help/api", - "models": [ + }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.25, - "output": 10 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -24812,33 +24723,31 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 5, - "output": 25 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -24848,45 +24757,37 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.6, - "output": 3 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -24899,98 +24800,69 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 3, - "output": 15 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -24998,50 +24870,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2, - "output": 12 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat Latest", - "display_name": "GPT-5.3 Chat Latest", + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -25049,35 +24905,44 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 1.75, - "output": 14 + "input": 1.2, + "output": 4, + "cache_read": 0.24, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -25088,37 +24953,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.5, - "output": 3 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "llama-3.3-70b-versatile", - "name": "Llama 3.3 70B Versatile", - "display_name": "Llama 3.3 70B Versatile", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -25128,97 +24987,99 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.59, - "output": 0.79 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.25, - "output": 2 + "input": 0.3, + "output": 0.9 }, "type": "chat" - }, + } + ] + }, + "zai-coding-plan": { + "id": "zai-coding-plan", + "name": "Z.AI Coding Plan", + "display_name": "Z.AI Coding Plan", + "api": "https://api.z.ai/api/coding/paas/v4", + "doc": "https://docs.z.ai/devpack/overview", + "models": [ { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25227,100 +25088,68 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.05, - "output": 0.4 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.75, - "output": 14 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -25328,7 +25157,7 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -25336,36 +25165,44 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 3, - "output": 15 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -25376,139 +25213,145 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.25, - "output": 10 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "deepinfra": { + "id": "deepinfra", + "name": "Deep Infra", + "display_name": "Deep Infra", + "doc": "https://deepinfra.com/models", + "models": [ { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 64000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 1.75, - "output": 14 + "input": 0.5, + "output": 2.15, + "cache_read": 0.35 }, "type": "chat" }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163840, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25517,65 +25360,62 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "knowledge": "2024-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 20, - "output": 40 + "input": 0.26, + "output": 0.38, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -25586,7 +25426,7 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -25606,33 +25446,35 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-11-06", + "last_updated": "2025-11-07", "cost": { - "input": 1.2, - "output": 6 + "input": 0.47, + "output": 2 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25641,47 +25483,45 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.75, + "output": 3.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25690,108 +25530,73 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.75, - "output": 14 + "input": 0.5, + "output": 2.8 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.4, + "output": 2, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat Latest", - "display_name": "GPT-5.2 Chat Latest", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -25799,36 +25604,38 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14 + "input": 0.03, + "output": 0.14 }, "type": "chat" }, { - "id": "gpt-5.3-codex-xhigh", - "name": "GPT-5.3 Codex XHigh", - "display_name": "GPT-5.3 Codex XHigh", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25836,132 +25643,100 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14 + "input": 0.05, + "output": 0.24 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "zai-org/GLM-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.25, - "output": 10 + "input": 0.43, + "output": 1.75, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -25971,10 +25746,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -25983,43 +25758,39 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.06, + "output": 0.4 }, "type": "chat" }, { - "id": "grok-4-0709", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 202752, "output": 16384 }, "temperature": true, @@ -26028,53 +25799,78 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 3, - "output": 15 + "input": 0.8, + "output": 2.56, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "route-llm", - "name": "Route LLM", - "display_name": "Route LLM", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 202752, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 3, - "output": 15 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "qwen-2.5-coder-32b", - "name": "Qwen 2.5 Coder 32B", - "display_name": "Qwen 2.5 Coder 32B", + "id": "zai-org/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -26084,28 +25880,42 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-11-11", - "last_updated": "2024-11-11", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.79, - "output": 0.79 + "input": 0.43, + "output": 1.74, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "zai-org/GLM-4.6V", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", @@ -26116,10 +25926,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26128,44 +25938,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.25, - "output": 10 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "anthropic/claude-3-7-sonnet-latest", + "name": "Claude Sonnet 3.7 (Latest)", + "display_name": "Claude Sonnet 3.7 (Latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -26173,28 +25972,50 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-10-31", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 15, - "output": 75 + "input": 3.3, + "output": 16.5, + "cache_read": 0.33 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "anthropic/claude-4-opus", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -26205,155 +26026,121 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-03-31", + "release_date": "2025-06-12", + "last_updated": "2025-06-12", "cost": { - "input": 2.5, - "output": 15 + "input": 16.5, + "output": 82.5 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat Latest", - "display_name": "GPT-5.1 Chat Latest", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.25, - "output": 10 + "input": 0.02, + "output": 0.05 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "meta-llama/Llama-3.1-70B-Instruct-Turbo", + "name": "Llama 3.1 70B Turbo", + "display_name": "Llama 3.1 70B Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1, - "output": 5 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama 4 Scout 17B", + "display_name": "Llama 4 Scout 17B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 10000000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 3, - "output": 15 + "input": 0.08, + "output": 0.3 }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo Preview", - "display_name": "Kimi K2 Turbo Preview", + "id": "meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama 3.1 70B", + "display_name": "Llama 3.1 70B", "modalities": { "input": [ "text" @@ -26363,89 +26150,87 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 131072, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, - "output": 8 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "meta-llama/Llama-3.1-8B-Instruct-Turbo", + "name": "Llama 3.1 8B Turbo", + "display_name": "Llama 3.1 8B Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.02, + "output": 0.03 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "type": "chat" + }, + { + "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", + "name": "Llama 3.3 70B Turbo", + "display_name": "Llama 3.3 70B Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 16384 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 5, - "output": 25 + "input": 0.1, + "output": 0.32 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 Nano", - "display_name": "GPT-4.1 Nano", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B FP8", + "display_name": "Llama 4 Maverick 17B FP8", "modalities": { "input": [ "text", @@ -26456,98 +26241,84 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1000000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 3, - "output": 15 + "input": 0.28, + "output": 1.2 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26556,46 +26327,44 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2, - "output": 8 + "input": 0.27, + "output": 0.95, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "MiniMaxAI/MiniMax-M2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26604,129 +26373,129 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1.25, - "output": 10 + "input": 0.254, + "output": 1.02 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 15, - "output": 75 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen 3.5 397B A17B", + "display_name": "Qwen 3.5 397B A17B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-01", + "last_updated": "2026-04-20", "cost": { - "input": 2, - "output": 8 + "input": 0.54, + "output": 3.4 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { "input": 0.4, "output": 1.6 @@ -26734,130 +26503,145 @@ "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "Qwen/Qwen3.5-35B-A3B", + "name": "Qwen 3.5 35B A3B", + "display_name": "Qwen 3.5 35B A3B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 81920 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-01", + "last_updated": "2026-04-20", "cost": { - "input": 1.25, - "output": 10 + "input": 0.2, + "output": 0.95 }, "type": "chat" }, { - "id": "gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ "text", "image", - "audio" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0.2, + "output": 1 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "deepseek-ai/DeepSeek-V4-Flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 16384 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -26867,8 +26651,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -26876,31 +26660,45 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.55, - "output": 1.66 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "google/gemma-4-26B-A4B-it", + "name": "Gemma 4 26B", + "display_name": "Gemma 4 26B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -26908,41 +26706,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2024-11-28", - "last_updated": "2024-11-28", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.07, + "output": 0.34 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct", - "display_name": "Qwen3 235B A22B Instruct", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 256000, "output": 8192 }, "temperature": true, @@ -26953,18 +26741,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { "input": 0.13, - "output": 0.6 + "output": 0.38 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "xiaomi/mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -26974,8 +26762,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -26996,21 +26784,42 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.09, - "output": 0.29 + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "Qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "xiaomi/mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" @@ -27018,7 +26827,7 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -27026,93 +26835,123 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.29, - "output": 1.2 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + }, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" - }, + } + ] + }, + "clarifai": { + "id": "clarifai", + "name": "Clarifai", + "display_name": "Clarifai", + "api": "https://api.clarifai.com/v2/ext/openai/v1", + "doc": "https://docs.clarifai.com/compute/inference/", + "models": [ { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen 2.5 72B Instruct", - "display_name": "Qwen 2.5 72B Instruct", + "id": "deepseek-ai/deepseek-ocr/models/DeepSeek-OCR", + "name": "DeepSeek OCR", + "display_name": "DeepSeek OCR", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "release_date": "2025-10-20", + "last_updated": "2026-02-25", "cost": { - "input": 0.11, - "output": 0.38 + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "clarifai/main/models/mm-poly-8b", + "name": "MM Poly 8B", + "display_name": "MM Poly 8B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "attachment": true, + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2026-02-25", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.658, + "output": 1.11 }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "openai/chat-completion/models/gpt-oss-120b-high-throughput", + "name": "GPT OSS 120B High Throughput", + "display_name": "GPT OSS 120B High Throughput", "modalities": { "input": [ "text" @@ -27122,8 +26961,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -27131,31 +26970,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-08-05", + "last_updated": "2026-02-25", "cost": { - "input": 1, - "output": 3.2 + "input": 0.09, + "output": 0.36 }, "type": "chat" }, { - "id": "zai-org/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "openai/chat-completion/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -27165,8 +26993,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -27174,20 +27002,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-08-05", + "last_updated": "2025-12-12", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.045, + "output": 0.18 }, "type": "chat" }, { - "id": "zai-org/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "arcee_ai/AFM/models/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ "text" @@ -27197,64 +27030,64 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2026-02-25", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.045, + "output": 0.15 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", - "name": "Llama 3.1 405B Instruct Turbo", - "display_name": "Llama 3.1 405B Instruct Turbo", + "id": "mistralai/completion/models/Ministral-3-14B-Reasoning-2512", + "name": "Ministral 3 14B Reasoning 2512", + "display_name": "Ministral 3 14B Reasoning 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-12", "cost": { - "input": 3.5, - "output": 3.5 + "input": 2.5, + "output": 1.7 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "mistralai/completion/models/Ministral-3-3B-Reasoning-2512", + "name": "Ministral 3 3B Reasoning 2512", + "display_name": "Ministral 3 3B Reasoning 2512", "modalities": { "input": [ "text", @@ -27265,29 +27098,29 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-12", + "last_updated": "2026-02-25", "cost": { - "input": 0.14, - "output": 0.59 + "input": 1.039, + "output": 0.54825 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "qwen/qwenCoder/models/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -27297,8 +27130,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -27307,18 +27140,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2026-02-12", "cost": { - "input": 0.02, - "output": 0.05 + "input": 0.11458, + "output": 0.74812 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -27328,40 +27162,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-07-30", + "last_updated": "2026-02-25", "cost": { - "input": 3, - "output": 7 + "input": 0.3, + "output": 0.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -27371,8 +27193,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -27382,23 +27204,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2025-07-31", + "last_updated": "2026-02-25", "cost": { - "input": 0.27, - "output": 0.4 + "input": 0.36, + "output": 1.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "minimaxai/chat-completion/models/MiniMax-M2_5-high-throughput", + "name": "MiniMax-M2.5 High Throughput", + "display_name": "MiniMax-M2.5 High Throughput", "modalities": { "input": [ "text" @@ -27408,8 +27236,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -27419,18 +27247,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-25", "cost": { - "input": 0.27, - "output": 1 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "moonshotai/chat-completion/models/Kimi-K2_6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -27441,8 +27269,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -27452,32 +27280,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.08, - "output": 0.44 + "input": 0.95, + "output": 4 }, "type": "chat" } ] }, - "perplexity-agent": { - "id": "perplexity-agent", - "name": "Perplexity Agent", - "display_name": "Perplexity Agent", - "api": "https://api.perplexity.ai/v1", - "doc": "https://docs.perplexity.ai/docs/agent-api/models", + "moark": { + "id": "moark", + "name": "Moark", + "display_name": "Moark", + "api": "https://moark.com/v1", + "doc": "https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", "models": [ { - "id": "perplexity/sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -27487,75 +27322,99 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.25, - "output": 2.5, - "cache_read": 0.0625 + "input": 2.1, + "output": 8.4 }, "type": "chat" }, { - "id": "xai/grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 3.5, + "output": 14 }, "type": "chat" - }, + } + ] + }, + "frogbot": { + "id": "frogbot", + "name": "FrogBot", + "display_name": "FrogBot", + "api": "https://app.frogbot.ai/api/v1", + "doc": "https://docs.frogbot.ai", + "models": [ { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super 120B", - "display_name": "Nemotron 3 Super 120B", + "id": "kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -27563,21 +27422,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "open_weights": false, + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.25, - "output": 2.5 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -27589,10 +27459,10 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27600,41 +27470,26 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", @@ -27645,165 +27500,123 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-11", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { "input": 1.25, "output": 10, - "cache_read": 0.125 + "cache_read": 0.31 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", "modalities": { "input": [ "text", @@ -27814,130 +27627,94 @@ ] }, "limit": { - "context": 1050000, + "context": 2000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-11", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "deepseek-v4-pro", + "name": "DeepSeek v4 Pro", + "display_name": "DeepSeek v4 Pro", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2026-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 1.74, + "output": 3.48, + "cache_read": 0.14 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "gpt-5-5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -27947,119 +27724,84 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 2000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-11", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "grok-code-fast-1", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -28069,53 +27811,69 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, + "attachment": false, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + }, + "type": "chat" + }, + { + "id": "minimax-m2-7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 192000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-09", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0.3, - "output": 2.5, - "cache_read": 0.03 + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -28128,20 +27886,18 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1 + "input": 0.07, + "output": 0.2 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", + "id": "claude-sonnet-4-6", "name": "Claude Sonnet 4.6", "display_name": "Claude Sonnet 4.6", "modalities": { @@ -28198,89 +27954,63 @@ "cost": { "input": 3, "output": 15, - "cache_read": 0.3 + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "kimi-k2-6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gpt-5-3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -28288,25 +28018,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2026-01-31", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -28321,7 +28067,7 @@ "context": 200000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -28331,44 +28077,43 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "high", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh" ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { "input": 5, "output": 25, - "cache_read": 0.5 + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen-3-6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ "text", @@ -28380,7 +28125,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -28389,79 +28134,92 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-04-02", + "last_updated": "2026-04-03", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3 + "input": 0.5, + "output": 3, + "cache_read": 0.1 }, "type": "chat" - } - ] - }, - "siliconflow": { - "id": "siliconflow", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.cn/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ + }, { - "id": "Kwaipilot/KAT-Dev", - "name": "Kwaipilot/KAT-Dev", - "display_name": "Kwaipilot/KAT-Dev", + "id": "gpt-5-4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-27", - "last_updated": "2026-01-16", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { "input": 0.2, - "output": 0.6 + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen/Qwen3.5-397B-A17B", - "display_name": "Qwen/Qwen3.5-397B-A17B", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -28473,87 +28231,109 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.29, - "output": 1.74 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-35B-A3B", - "name": "Qwen/Qwen3.5-35B-A3B", - "display_name": "Qwen/Qwen3.5-35B-A3B", + "id": "gpt-5-4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-25", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.23, - "output": 1.86 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-122B-A10B", - "name": "Qwen/Qwen3.5-122B-A10B", - "display_name": "Qwen/Qwen3.5-122B-A10B", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -28565,180 +28345,179 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-07-17", + "last_updated": "2025-07-17", "cost": { - "input": 0.29, - "output": 2.32 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-9B", - "name": "Qwen/Qwen3.5-9B", - "display_name": "Qwen/Qwen3.5-9B", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.22, - "output": 1.74 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-27B", - "name": "Qwen/Qwen3.5-27B", - "display_name": "Qwen/Qwen3.5-27B", + "id": "zai-glm-5-1", + "name": "Z.AI GLM-5.1", + "display_name": "Z.AI GLM-5.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 198000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-25", - "last_updated": "2026-02-25", + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-02-22", "cost": { - "input": 0.26, - "output": 2.09 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-4B", - "name": "Qwen/Qwen3.5-4B", - "display_name": "Qwen/Qwen3.5-4B", + "id": "minimax-m2-5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 192000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-01-15", + "last_updated": "2025-02-22", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-35B-A3B", - "name": "Qwen/Qwen3.6-35B-A3B", - "display_name": "Qwen/Qwen3.6-35B-A3B", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -28748,61 +28527,69 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.23, - "output": 1.86 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", + "id": "gemini-3-1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2026-01", + "release_date": "2026-02-18", + "last_updated": "2026-02-18", "cost": { - "input": 0.59, - "output": 0.59 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" - }, + } + ] + }, + "cohere": { + "id": "cohere", + "name": "Cohere", + "display_name": "Cohere", + "doc": "https://docs.cohere.com/docs/models", + "models": [ { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "id": "c4ai-aya-expanse-32b", + "name": "Aya Expanse 32B", + "display_name": "Aya Expanse 32B", "modalities": { "input": [ "text" @@ -28812,59 +28599,57 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", - "cost": { - "input": 0.25, - "output": 1 - } + "open_weights": true, + "release_date": "2024-10-24", + "last_updated": "2024-10-24", + "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Instruct", - "name": "Qwen/Qwen3-VL-8B-Instruct", - "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "id": "command-a-reasoning-08-2025", + "name": "Command A Reasoning", + "display_name": "Command A Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.18, - "output": 0.68 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Instruct", - "name": "Qwen/Qwen3-VL-32B-Instruct", - "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "id": "c4ai-aya-vision-8b", + "name": "Aya Vision 8B", + "display_name": "Aya Vision 8B", "modalities": { "input": [ "text", @@ -28875,28 +28660,24 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 16000, + "output": 4000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", - "cost": { - "input": 0.2, - "output": 0.6 - }, + "open_weights": true, + "release_date": "2025-03-04", + "last_updated": "2025-05-14", "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "id": "command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -28906,40 +28687,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.29, - "output": 1 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-14B-Instruct", - "name": "Qwen/Qwen2.5-14B-Instruct", - "display_name": "Qwen/Qwen2.5-14B-Instruct", + "id": "command-a-03-2025", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ "text" @@ -28949,8 +28719,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -28958,19 +28728,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "c4ai-aya-expanse-8b", + "name": "Aya Expanse 8B", + "display_name": "Aya Expanse 8B", "modalities": { "input": [ "text" @@ -28980,28 +28751,57 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8000, + "output": 4000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2024-10-24", + "last_updated": "2024-10-24", + "type": "chat" + }, + { + "id": "command-a-vision-07-2025", + "name": "Command A Vision", + "display_name": "Command A Vision", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.3, - "output": 1.5 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "id": "command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" @@ -29011,40 +28811,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.14, - "output": 0.57 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "command-r7b-12-2024", + "name": "Command R7B", + "display_name": "Command R7B", "modalities": { "input": [ "text" @@ -29054,71 +28843,57 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.0375, + "output": 0.15 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "id": "c4ai-aya-vision-32b", + "name": "Aya Vision 32B", + "display_name": "Aya Vision 32B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 16000, + "output": 4000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.4 - }, + "open_weights": true, + "release_date": "2025-03-04", + "last_updated": "2025-05-14", "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "id": "command-r7b-arabic-02-2025", + "name": "Command R7B Arabic", + "display_name": "Command R7B Arabic", "modalities": { "input": [ "text" @@ -29128,40 +28903,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0.0375, + "output": 0.15 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "command-a-translate-08-2025", + "name": "Command A Translate", + "display_name": "Command A Translate", "modalities": { "input": [ "text" @@ -29171,8 +28935,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -29180,19 +28944,29 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-19", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.18, - "output": 0.18 + "input": 2.5, + "output": 10 }, "type": "chat" - }, + } + ] + }, + "wandb": { + "id": "wandb", + "name": "Weights & Biases", + "display_name": "Weights & Biases", + "api": "https://api.inference.wandb.ai/v1", + "doc": "https://docs.wandb.ai/guides/integrations/inference/", + "models": [ { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -29202,8 +28976,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 161000, + "output": 161000 }, "temperature": true, "tool_call": true, @@ -29211,35 +28985,37 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2026-03-12", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.55, + "output": 1.65 }, "type": "chat" }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -29252,20 +29028,20 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-03-12", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.5, + "output": 2.85 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "id": "openai/gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -29276,27 +29052,32 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2025-08-05", + "last_updated": "2026-03-12", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "id": "openai/gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -29307,26 +29088,32 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-11-25", + "release_date": "2025-08-05", + "last_updated": "2026-03-12", "cost": { - "input": 0.07, - "output": 0.28 - } + "input": 0.15, + "output": 0.6 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "zai-org/GLM-5-FP8", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -29336,39 +29123,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-03-12", "cost": { - "input": 0.14, - "output": 0.57 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "id": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-FP8", + "name": "NVIDIA Nemotron 3 Super 120B", + "display_name": "NVIDIA Nemotron 3 Super 120B", "modalities": { "input": [ "text" @@ -29378,8 +29154,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -29387,19 +29163,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-03-11", + "last_updated": "2026-03-12", "cost": { - "input": 0.09, - "output": 0.6 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "id": "microsoft/Phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -29409,28 +29185,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2026-03-12", "cost": { - "input": 0.09, - "output": 0.3 + "input": 0.08, + "output": 0.35 }, "type": "chat" }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": "OpenPipe/Qwen3-14B-Instruct", + "name": "OpenPipe Qwen3 14B Instruct", + "display_name": "OpenPipe Qwen3 14B Instruct", "modalities": { "input": [ "text" @@ -29440,39 +29218,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2026-03-12", "cost": { - "input": 0.06, - "output": 0.06 + "input": 0.05, + "output": 0.22 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -29482,28 +29249,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.22, + "output": 0.22 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Thinking", - "name": "Qwen/Qwen3-VL-8B-Thinking", - "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", @@ -29514,8 +29283,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 64000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -29523,31 +29292,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2026-03-12", "cost": { - "input": 0.18, - "output": 2 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "id": "meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama 3.1 70B", + "display_name": "Llama 3.1 70B", "modalities": { "input": [ "text" @@ -29557,28 +29316,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -29588,14 +29347,84 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2026-03-12", + "cost": { + "input": 0.71, + "output": 0.71 + }, + "type": "chat" + }, + { + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-03-12", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, "extra_capabilities": { "reasoning": { "supported": true, @@ -29608,19 +29437,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-06", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2026-03-12", "cost": { - "input": 0.15, - "output": 0.58 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -29630,28 +29460,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2026-03-12", "cost": { - "input": 0.29, - "output": 1 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -29661,8 +29491,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -29670,18 +29500,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-11-11", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2026-03-12", "cost": { - "input": 0.18, - "output": 0.18 - } + "input": 0.1, + "output": 0.1 + }, + "type": "chat" }, { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -29691,8 +29523,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -29700,19 +29532,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0.05, - "output": 0.05 + "input": 1, + "output": 1.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -29722,8 +29555,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -29742,20 +29575,31 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.45, - "output": 3.5 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "gmicloud": { + "id": "gmicloud", + "name": "GMI Cloud", + "display_name": "GMI Cloud", + "api": "https://api.gmi-serving.com/v1", + "doc": "https://docs.gmicloud.ai/inference-engine/api-reference/llm-api-reference", + "models": [ { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "id": "deepseek-ai/DeepSeek-V4-Flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -29765,8 +29609,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048575, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -29786,31 +29630,32 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.09, - "output": 0.3 + "input": 0.112, + "output": 0.224, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Thinking", - "name": "Qwen/Qwen3-VL-32B-Thinking", - "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -29829,20 +29674,22 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.2, - "output": 1.5 + "input": 1.392, + "output": 2.784, + "cache_read": 0.116 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text" @@ -29852,28 +29699,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.855, + "output": 3.6, + "cache_read": 0.144 }, "type": "chat" }, { - "id": "stepfun-ai/Step-3.5-Flash", - "name": "stepfun-ai/Step-3.5-Flash", - "display_name": "stepfun-ai/Step-3.5-Flash", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -29883,8 +29744,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -29892,20 +29753,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.98, + "output": 3.08, + "cache_read": 0.182 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5V", - "name": "zai-org/GLM-4.5V", - "display_name": "zai-org/GLM-4.5V", + "id": "zai-org/GLM-5-FP8", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -29915,28 +29788,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.14, - "output": 0.86 + "input": 0.6, + "output": 1.92, + "cache_read": 0.12 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "zai-org/GLM-4.6", - "display_name": "zai-org/GLM-4.6", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text" @@ -29946,66 +29832,117 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 409600, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.5, - "output": 1.9 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "zai-org/GLM-4.6V", - "display_name": "zai-org/GLM-4.6V", + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 409600, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-07", - "last_updated": "2025-12-07", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.3, - "output": 0.9 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "zai-org/GLM-4.5-Air", - "display_name": "zai-org/GLM-4.5-Air", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text" @@ -30015,59 +29952,111 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 409600, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.14, - "output": 0.86 + "input": 4.5, + "output": 22.5, + "cache_read": 0.45 }, "type": "chat" - }, + } + ] + }, + "ambient": { + "id": "ambient", + "name": "Ambient", + "display_name": "Ambient", + "api": "https://api.ambient.xyz/v1", + "doc": "https://ambient.xyz", + "models": [ { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.95, + "output": 4, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -30077,28 +30066,51 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.07, - "output": 0.28 + "input": 1.4, + "output": 4.4, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "routing-run": { + "id": "routing-run", + "name": "routing.run", + "display_name": "routing.run", + "api": "https://api.routing.run/v1", + "doc": "https://docs.routing.run/api-reference/models", + "models": [ { - "id": "inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", + "id": "route/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -30108,8 +30120,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -30123,40 +30135,55 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.4928, + "output": 0.7392 }, "type": "chat" }, { - "id": "ascend-tribe/pangu-pro-moe", - "name": "ascend-tribe/pangu-pro-moe", - "display_name": "ascend-tribe/pangu-pro-moe", + "id": "route/qwen3.5-9b", + "name": "Qwen3.5 9B", + "display_name": "Qwen3.5 9B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2026-01-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-03-10", + "last_updated": "2026-03-10", "cost": { "input": 0.2, "output": 0.6 @@ -30164,84 +30191,69 @@ "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "route/qwen3.5-9b-chat", + "name": "Qwen3.5 9B Chat", + "display_name": "Qwen3.5 9B Chat", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2026-03-10", + "last_updated": "2026-03-10", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-4.7", - "name": "Pro/zai-org/GLM-4.7", - "display_name": "Pro/zai-org/GLM-4.7", + "id": "route/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -30259,19 +30271,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.462, + "output": 2.42, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-5.1", - "name": "Pro/zai-org/GLM-5.1", - "display_name": "Pro/zai-org/GLM-5.1", + "id": "route/minimax-m2.7-highspeed", + "name": "MiniMax M2.7 Highspeed", + "display_name": "MiniMax M2.7 Highspeed", "modalities": { "input": [ "text" @@ -30281,8 +30295,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30303,19 +30317,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.4, - "output": 4.4, - "cache_write": 0 + "input": 0.33, + "output": 1.32, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-5", - "name": "Pro/zai-org/GLM-5", - "display_name": "Pro/zai-org/GLM-5", + "id": "route/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -30325,8 +30340,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -30346,19 +30361,21 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { "input": 1, - "output": 3.2 + "output": 3, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-V3", - "name": "Pro/deepseek-ai/DeepSeek-V3", - "display_name": "Pro/deepseek-ai/DeepSeek-V3", + "id": "route/step-3.5-flash-full", + "name": "Step 3.5 Flash Full", + "display_name": "Step 3.5 Flash Full", "modalities": { "input": [ "text" @@ -30368,39 +30385,45 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.25, - "output": 1 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-R1", - "name": "Pro/deepseek-ai/DeepSeek-R1", - "display_name": "Pro/deepseek-ai/DeepSeek-R1", + "id": "route/qwen3.6-27b", + "name": "Qwen3.6 27B", + "display_name": "Qwen3.6 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -30419,33 +30442,35 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.5, - "output": 2.18 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-V3.2", - "name": "Pro/deepseek-ai/DeepSeek-V3.2", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.2", + "id": "route/kimi-k2.5-highspeed", + "name": "Kimi K2.5 Highspeed", + "display_name": "Kimi K2.5 Highspeed", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -30453,55 +30478,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", - "cost": { - "input": 0.27, - "output": 0.42 - }, - "type": "chat" - }, - { - "id": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.27, - "output": 1 + "input": 0.6468, + "output": 3.388, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2-Thinking", - "name": "Pro/moonshotai/Kimi-K2-Thinking", - "display_name": "Pro/moonshotai/Kimi-K2-Thinking", + "id": "route/deepseek-v4-pro-precision", + "name": "DeepSeek V4 Pro Precision", + "display_name": "DeepSeek V4 Pro Precision", "modalities": { "input": [ "text" @@ -30511,8 +30512,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30532,31 +30533,32 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.55, - "output": 2.5 + "input": 0.7392, + "output": 1.1088, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2.6", - "name": "Pro/moonshotai/Kimi-K2.6", - "display_name": "Pro/moonshotai/Kimi-K2.6", + "id": "route/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30577,19 +30579,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2-Instruct-0905", - "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", - "display_name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "id": "route/glm-5-highspeed", + "name": "GLM 5 Highspeed", + "display_name": "GLM 5 Highspeed", "modalities": { "input": [ "text" @@ -30599,40 +30602,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", - "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" - }, - { - "id": "Pro/moonshotai/Kimi-K2.5", - "name": "Pro/moonshotai/Kimi-K2.5", - "display_name": "Pro/moonshotai/Kimi-K2.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262000, - "output": 262000 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -30653,18 +30624,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.45, - "output": 2.25 + "input": 1.1088, + "output": 3.542, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/MiniMaxAI/MiniMax-M2.5", - "name": "Pro/MiniMaxAI/MiniMax-M2.5", - "display_name": "Pro/MiniMaxAI/MiniMax-M2.5", + "id": "route/mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ "text" @@ -30674,13 +30647,14 @@ ] }, "limit": { - "context": 192000, - "output": 131000 + "context": 1000000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -30694,19 +30668,37 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.3, - "output": 1.22 + "input": 0.45, + "output": 1.35, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "Pro/MiniMaxAI/MiniMax-M2.1", - "name": "Pro/MiniMaxAI/MiniMax-M2.1", - "display_name": "Pro/MiniMaxAI/MiniMax-M2.1", + "id": "route/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -30716,13 +30708,14 @@ ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -30730,19 +30723,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.193, + "output": 1.238, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "PaddlePaddle/PaddleOCR-VL", - "name": "PaddlePaddle/PaddleOCR-VL", - "display_name": "PaddlePaddle/PaddleOCR-VL", + "id": "route/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", @@ -30753,90 +30748,115 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-10-16", - "last_updated": "2025-10-16", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "PaddlePaddle/PaddleOCR-VL-1.5", - "name": "PaddlePaddle/PaddleOCR-VL-1.5", - "display_name": "PaddlePaddle/PaddleOCR-VL-1.5", + "id": "route/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0, - "output": 0 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-OCR", - "name": "deepseek-ai/DeepSeek-OCR", - "display_name": "deepseek-ai/DeepSeek-OCR", + "id": "route/glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2025-10-20", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0, - "output": 0 - } + "input": 1.32, + "output": 4.4, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "route/glm-5.1-full", + "name": "GLM 5.1 Full", + "display_name": "GLM 5.1 Full", "modalities": { "input": [ "text" @@ -30846,8 +30866,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -30855,20 +30875,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.27, - "output": 1 + "input": 1.2, + "output": 3.5, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "deepseek-ai/DeepSeek-V3.2", - "display_name": "deepseek-ai/DeepSeek-V3.2", + "id": "route/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ "text" @@ -30878,8 +30911,8 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30889,34 +30922,43 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.27, - "output": 0.42 + "input": 0.33, + "output": 1.32, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "route/mistral-small-2503", + "name": "Mistral Small 2503", + "display_name": "Mistral Small 2503", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -30924,20 +30966,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "deepseek-ai/DeepSeek-R1", - "display_name": "deepseek-ai/DeepSeek-R1", + "id": "route/mimo-v2.5-pro-precision", + "name": "MiMo V2.5 Pro Precision", + "display_name": "MiMo V2.5 Pro Precision", "modalities": { "input": [ "text" @@ -30947,8 +30990,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30968,19 +31011,37 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.5, - "output": 2.18 + "input": 0.45, + "output": 1.35, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "route/stepfun-3.5-flash", + "name": "StepFun 3.5 Flash", + "display_name": "StepFun 3.5 Flash", "modalities": { "input": [ "text" @@ -30990,8 +31051,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -31000,50 +31061,54 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "deepseek-ai/DeepSeek-V3", - "display_name": "deepseek-ai/DeepSeek-V3", + "id": "route/mistral-large-3", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0.25, - "output": 1 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "route/step-3.5-flash-2603", + "name": "Step 3.5 Flash 2603", + "display_name": "Step 3.5 Flash 2603", "modalities": { "input": [ "text" @@ -31053,90 +31118,128 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "route/mistral-medium-2505", + "name": "Mistral Medium 2505", + "display_name": "Mistral Medium 2505", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2025-11-25", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", + "id": "route/mimo-v2.5", + "name": "MiMo V2.5", + "display_name": "MiMo V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + }, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "route/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -31146,28 +31249,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "route/glm-5.1-precision", + "name": "GLM 5.1 Precision", + "display_name": "GLM 5.1 Precision", "modalities": { "input": [ "text" @@ -31177,90 +31294,136 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.086, - "output": 0.086 + "input": 1.2, + "output": 3.5, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "route/kimi-k2.6-precision", + "name": "Kimi K2.6 Precision", + "display_name": "Kimi K2.6 Precision", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.086, - "output": 0.086 + "input": 0.6468, + "output": 3.388, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "moonshotai/Kimi-K2-Instruct-0905", - "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "id": "route/kimi-k2.6-full", + "name": "Kimi K2.6 Full", + "display_name": "Kimi K2.6 Full", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.4, - "output": 2 + "input": 0.462, + "output": 2.42, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "moonshotai/Kimi-K2-Thinking", - "display_name": "moonshotai/Kimi-K2-Thinking", + "id": "route/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -31270,8 +31433,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -31279,31 +31442,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.55, - "output": 2.5 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "route/minimax-m2.5-highspeed", + "name": "MiniMax M2.5 Highspeed", + "display_name": "MiniMax M2.5 Highspeed", "modalities": { "input": [ "text" @@ -31313,13 +31467,14 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -31327,19 +31482,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.21, - "output": 0.57 + "input": 0.193, + "output": 1.238, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", + "id": "route/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -31349,19 +31506,43 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 1.32, + "output": 4.4, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "id": "route/glm-5.1-fp16", + "name": "GLM 5.1 FP16", + "display_name": "GLM 5.1 FP16", "modalities": { "input": [ "text" @@ -31371,19 +31552,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 202752 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 1.2, + "output": 3.5, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "inclusionAI/Ring-1T", - "name": "inclusionAI/Ring-1T", - "display_name": "inclusionAI/Ring-1T", + "id": "route/glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -31393,9 +31597,10 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 202752 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -31403,15 +31608,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0.792, + "output": 2.53, + "cache_read": 0.2, + "cache_write": 0 + }, "type": "chat" }, { - "id": "inclusionAI/Ling-1T", - "name": "inclusionAI/Ling-1T", - "display_name": "inclusionAI/Ling-1T", + "id": "route/deepseek-v4-flash-full", + "name": "DeepSeek V4 Flash Full", + "display_name": "DeepSeek V4 Flash Full", "modalities": { "input": [ "text" @@ -31421,107 +31642,98 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "Qwen/Qwen-Image-Edit-2509", - "name": "Qwen/Qwen-Image-Edit-2509", - "display_name": "Qwen/Qwen-Image-Edit-2509", + "id": "route/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ + "text", "image", - "text" + "video" ], "output": [ - "image" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Qwen/Qwen-Image-Edit", - "name": "Qwen/Qwen-Image-Edit", - "display_name": "Qwen/Qwen-Image-Edit", - "modalities": { - "input": [ - "image", "text" - ], - "output": [ - "image" ] }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Qwen/Qwen-Image", - "name": "Qwen/Qwen-Image", - "display_name": "Qwen/Qwen-Image", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] + "limit": { + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } - }, - { - "id": "Wan-AI/Wan2.2-I2V-A14B", - "name": "Wan-AI/Wan2.2-I2V-A14B", - "display_name": "Wan-AI/Wan2.2-I2V-A14B", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "video" - ] + "supported": true, + "default": true }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Wan-AI/Wan2.2-T2V-A14B", - "name": "Wan-AI/Wan2.2-T2V-A14B", - "display_name": "Wan-AI/Wan2.2-T2V-A14B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "video" - ] + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.462, + "output": 2.42, + "cache_read": 0.16 + }, + "type": "chat" + } + ] + }, + "the-grid-ai": { + "id": "the-grid-ai", + "name": "The Grid AI", + "display_name": "The Grid AI", + "api": "https://api.thegrid.ai/v1", + "doc": "https://thegrid.ai/docs", + "models": [ { - "id": "zai-org/GLM-4.5", - "name": "zai-org/GLM-4.5", - "display_name": "zai-org/GLM-4.5", + "id": "text-max", + "name": "Text Max", + "display_name": "Text Max", "modalities": { "input": [ "text" @@ -31531,19 +31743,25 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-24", + "last_updated": "2026-03-24", "type": "chat" }, { - "id": "stepfun-ai/step3", - "name": "stepfun-ai/step3", - "display_name": "stepfun-ai/step3", + "id": "text-prime", + "name": "Text Prime", + "display_name": "Text Prime", "modalities": { "input": [ "text" @@ -31553,36 +31771,25 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 30000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "type": "chat" }, { - "id": "TeleAI/TeleSpeechASR", - "name": "TeleAI/TeleSpeechASR", - "display_name": "TeleAI/TeleSpeechASR", - "modalities": { - "input": [ - "audio" - ], - "output": [ - "text" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "THUDM/GLM-4.1V-9B-Thinking", - "name": "THUDM/GLM-4.1V-9B-Thinking", - "display_name": "THUDM/GLM-4.1V-9B-Thinking", + "id": "text-standard", + "name": "Text Standard", + "display_name": "Text Standard", "modalities": { "input": [ "text" @@ -31592,20 +31799,34 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "type": "chat" - }, + } + ] + }, + "fastrouter": { + "id": "fastrouter", + "name": "FastRouter", + "display_name": "FastRouter", + "api": "https://go.fastrouter.ai/api/v1", + "doc": "https://fastrouter.ai/models", + "models": [ { - "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "id": "deepseek-ai/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -31616,19 +31837,34 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-01-23", + "last_updated": "2025-01-23", + "cost": { + "input": 0.03, + "output": 0.14 + }, "type": "chat" }, { - "id": "moonshotai/Kimi-Dev-72B", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", + "id": "moonshotai/kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -31639,18 +31875,28 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "cost": { + "input": 0.55, + "output": 2.2 + }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMaxAI/MiniMax-M1-80k", - "display_name": "MiniMaxAI/MiniMax-M1-80k", + "id": "z-ai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -31660,19 +31906,40 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0.95, + "output": 3.15 }, "type": "chat" }, { - "id": "Tongyi-Zhiwen/QwenLong-L1-32B", - "name": "Tongyi-Zhiwen/QwenLong-L1-32B", - "display_name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -31683,308 +31950,586 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.05, + "output": 0.2 + }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "display_name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen/Qwen3-30B-A3B", - "display_name": "Qwen/Qwen3-30B-A3B", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-8B", - "name": "Qwen/Qwen3-Reranker-8B", - "display_name": "Qwen/Qwen3-Reranker-8B", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "type": "rerank" - }, - { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen/Qwen3-Embedding-8B", - "display_name": "Qwen/Qwen3-Embedding-8B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "embedding" - ] + "supported": true, + "default": true }, - "limit": { - "context": 8192, - "output": 2048 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - "tool_call": false, - "reasoning": { - "supported": false + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.15, + "output": 0.6 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-4B", - "name": "Qwen/Qwen3-Reranker-4B", - "display_name": "Qwen/Qwen3-Reranker-4B", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "rerank" + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-4B", - "name": "Qwen/Qwen3-Embedding-4B", - "display_name": "Qwen/Qwen3-Embedding-4B", + "id": "x-ai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 256000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 15 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-0.6B", - "name": "Qwen/Qwen3-Reranker-0.6B", - "display_name": "Qwen/Qwen3-Reranker-0.6B", + "id": "qwen/qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 66536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-0.6B", - "name": "Qwen/Qwen3-Embedding-0.6B", - "display_name": "Qwen/Qwen3-Embedding-0.6B", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen/Qwen3-235B-A22B", - "display_name": "Qwen/Qwen3-235B-A22B", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.0375 + }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, "type": "chat" }, { - "id": "Qwen/QVQ-72B-Preview", - "name": "Qwen/QVQ-72B-Preview", - "display_name": "Qwen/QVQ-72B-Preview", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, "type": "chat" - }, + } + ] + }, + "tencent-coding-plan": { + "id": "tencent-coding-plan", + "name": "Tencent Coding Plan (China)", + "display_name": "Tencent Coding Plan (China)", + "api": "https://api.lkeap.cloud.tencent.com/coding/v3", + "doc": "https://cloud.tencent.com/document/product/1772/128947", + "models": [ { - "id": "deepseek-ai/DeepSeek-V2.5", - "name": "deepseek-ai/DeepSeek-V2.5", - "display_name": "deepseek-ai/DeepSeek-V2.5", + "id": "kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "hunyuan-turbos", + "name": "Hunyuan-TurboS", + "display_name": "Hunyuan-TurboS", "modalities": { "input": [ "text" @@ -31995,86 +32540,185 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, "type": "chat" }, { - "id": "fnlp/MOSS-TTSD-v0.5", - "name": "fnlp/MOSS-TTSD-v0.5", - "display_name": "fnlp/MOSS-TTSD-v0.5", + "id": "hunyuan-2.0-thinking", + "name": "Tencent HY 2.0 Think", + "display_name": "Tencent HY 2.0 Think", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "FunAudioLLM/CosyVoice2-0.5B", - "name": "FunAudioLLM/CosyVoice2-0.5B", - "display_name": "FunAudioLLM/CosyVoice2-0.5B", + "id": "hunyuan-2.0-instruct", + "name": "Tencent HY 2.0 Instruct", + "display_name": "Tencent HY 2.0 Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "FunAudioLLM/SenseVoiceSmall", - "name": "FunAudioLLM/SenseVoiceSmall", - "display_name": "FunAudioLLM/SenseVoiceSmall", + "id": "tc-code-latest", + "name": "Auto", + "display_name": "Auto", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "IndexTeam/IndexTTS-2", - "name": "IndexTeam/IndexTTS-2", - "display_name": "IndexTeam/IndexTTS-2", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 204800, + "output": 32768 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "BAAI/bge-m3", - "name": "BAAI/bge-m3", - "display_name": "BAAI/bge-m3", + "id": "hunyuan-t1", + "name": "Hunyuan-T1", + "display_name": "Hunyuan-T1", "modalities": { "input": [ "text" @@ -32085,100 +32729,224 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "BAAI/bge-reranker-v2-m3", - "name": "BAAI/bge-reranker-v2-m3", - "display_name": "BAAI/bge-reranker-v2-m3", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 202752, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "rerank" - }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + } + ] + }, + "cortecs": { + "id": "cortecs", + "name": "Cortecs", + "display_name": "Cortecs", + "api": "https://api.cortecs.ai/v1", + "doc": "https://api.cortecs.ai/v1/models", + "models": [ { - "id": "netease-youdao/bce-embedding-base_v1", - "name": "netease-youdao/bce-embedding-base_v1", - "display_name": "netease-youdao/bce-embedding-base_v1", + "id": "minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 196000, + "output": 196000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.34, + "output": 1.34 + }, + "type": "chat" }, { - "id": "netease-youdao/bce-reranker-base_v1", - "name": "netease-youdao/bce-reranker-base_v1", - "display_name": "netease-youdao/bce-reranker-base_v1", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0.55, + "output": 2.76 + }, + "type": "chat" }, { - "id": "Kwai-Kolors/Kolors", - "name": "Kwai-Kolors/Kolors", - "display_name": "Kwai-Kolors/Kolors", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 200000, + "output": 200000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1.09, + "output": 5.43 + }, + "type": "chat" }, { - "id": "Qwen/Qwen2-VL-72B-Instruct", - "name": "Qwen/Qwen2-VL-72B-Instruct", - "display_name": "Qwen/Qwen2-VL-72B-Instruct", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -32188,62 +32956,131 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-14", + "last_updated": "2026-04-14", + "cost": { + "input": 1.31, + "output": 4.1, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-7B-Instruct", - "name": "Qwen/Qwen2.5-Coder-7B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "id": "claude-opus4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", + "cost": { + "input": 5.6, + "output": 27.99, + "cache_read": 0.56, + "cache_write": 6.99 + }, + "type": "chat" }, { - "id": "internlm/internlm2_5-7b-chat", - "name": "internlm/internlm2_5-7b-chat", - "display_name": "internlm/internlm2_5-7b-chat", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65535 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-17", + "cost": { + "input": 1.654, + "output": 11.024 }, "type": "chat" }, { - "id": "Qwen/Qwen2-7B-Instruct", - "name": "Qwen/Qwen2-7B-Instruct", - "display_name": "Qwen/Qwen2-7B-Instruct", + "id": "minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -32253,19 +33090,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 400000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.39, + "output": 1.57 }, "type": "chat" }, { - "id": "THUDM/glm-4-9b-chat", - "name": "THUDM/glm-4-9b-chat", - "display_name": "THUDM/glm-4-9b-chat", + "id": "kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -32275,19 +33134,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-07-11", + "last_updated": "2025-09-05", + "cost": { + "input": 0.551, + "output": 2.646 + }, "type": "chat" }, { - "id": "BAAI/bge-large-en-v1.5", - "name": "BAAI/bge-large-en-v1.5", - "display_name": "BAAI/bge-large-en-v1.5", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -32297,19 +33166,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 164000, + "output": 164000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "cost": { + "input": 0.585, + "output": 2.307 + }, + "type": "chat" }, { - "id": "BAAI/bge-large-zh-v1.5", - "name": "BAAI/bge-large-zh-v1.5", - "display_name": "BAAI/bge-large-zh-v1.5", + "id": "deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -32319,19 +33210,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "cost": { + "input": 0.551, + "output": 1.654 + }, + "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-32B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-32B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "id": "codestral-2508", + "name": "Codestral 2508", + "display_name": "Codestral 2508", "modalities": { "input": [ "text" @@ -32341,19 +33242,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0.3, + "output": 0.9, + "cache_read": 0.03 + }, "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-14B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-14B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "id": "qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -32363,19 +33275,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 33000, + "output": 33000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", + "cost": { + "input": 0.062, + "output": 0.231 + }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -32385,20 +33307,35 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 163840, + "output": 163840 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.266, + "output": 0.444 + }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "id": "hermes-4-70b", + "name": "Hermes 4 70B", + "display_name": "Hermes 4 70B", "modalities": { "input": [ "text" @@ -32408,18 +33345,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "cost": { + "input": 0.116, + "output": 0.358 + }, + "type": "chat" }, { - "id": "Pro/BAAI/bge-m3", - "name": "Pro/BAAI/bge-m3", - "display_name": "Pro/BAAI/bge-m3", + "id": "devstral-2512", + "name": "Devstral 2 2512", + "display_name": "Devstral 2 2512", "modalities": { "input": [ "text" @@ -32429,63 +33378,97 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "id": "claude-opus4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 200000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5.98, + "output": 29.89 }, "type": "chat" }, { - "id": "Pro/BAAI/bge-reranker-v2-m3", - "name": "Pro/BAAI/bge-reranker-v2-m3", - "display_name": "Pro/BAAI/bge-reranker-v2-m3", + "id": "glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "rerank" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "cost": { + "input": 0.22, + "output": 1.34 + }, + "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-72B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-72B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -32495,19 +33478,40 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 196608, + "output": 196608 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.32, + "output": 1.18 }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2-7B-Instruct", - "name": "Pro/Qwen/Qwen2-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2-7B-Instruct", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -32517,63 +33521,107 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 203000, + "output": 203000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", + "cost": { + "input": 0.09, + "output": 0.53 }, "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-7B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-7B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "id": "devstral-small-2512", + "name": "Devstral Small 2 2512", + "display_name": "Devstral Small 2 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "Pro/THUDM/glm-4-9b-chat", - "name": "Pro/THUDM/glm-4-9b-chat", - "display_name": "Pro/THUDM/glm-4-9b-chat", + "id": "gpt-4.1", + "name": "GPT 4.1", + "display_name": "GPT 4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2.354, + "output": 9.417 + }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-Rumination-32B-0414", - "name": "THUDM/GLM-Z1-Rumination-32B-0414", - "display_name": "THUDM/GLM-Z1-Rumination-32B-0414", + "id": "glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -32584,189 +33632,381 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "cost": { + "input": 0.67, + "output": 2.46 + }, "type": "chat" }, { - "id": "stabilityai/stable-diffusion-xl-base-1.0", - "name": "stabilityai/stable-diffusion-xl-base-1.0", - "display_name": "stabilityai/stable-diffusion-xl-base-1.0", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next 80B", + "display_name": "Qwen3 Coder Next 80B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 256000, + "output": 65536 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-04", + "last_updated": "2026-02-04", + "cost": { + "input": 0.158, + "output": 0.84 + }, + "type": "chat" }, { - "id": "black-forest-labs/FLUX.1-schnell", - "name": "black-forest-labs/FLUX.1-schnell", - "display_name": "black-forest-labs/FLUX.1-schnell", + "id": "minimax-m2.7", + "name": "MiniMax-m2.7", + "display_name": "MiniMax-m2.7", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 202752, + "output": 196072 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.47, + "output": 1.4 + }, + "type": "chat" }, { - "id": "black-forest-labs/FLUX.1-dev", - "name": "black-forest-labs/FLUX.1-dev", - "display_name": "black-forest-labs/FLUX.1-dev", + "id": "intellect-3", + "name": "INTELLECT 3", + "display_name": "INTELLECT 3", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Pro/black-forest-labs/FLUX.1-schnell", - "name": "Pro/black-forest-labs/FLUX.1-schnell", - "display_name": "Pro/black-forest-labs/FLUX.1-schnell", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] + "limit": { + "context": 128000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", + "cost": { + "input": 0.219, + "output": 1.202 + }, + "type": "chat" }, { - "id": "stabilityai/stable-diffusion-3-5-large", - "name": "stabilityai/stable-diffusion-3-5-large", - "display_name": "stabilityai/stable-diffusion-3-5-large", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 16384, + "output": 16384 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "cost": { + "input": 0.099, + "output": 0.33 + }, + "type": "chat" }, { - "id": "fishaudio/fish-speech-1.4", - "name": "fishaudio/fish-speech-1.4", - "display_name": "fishaudio/fish-speech-1.4", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "cost": { + "input": 0.164, + "output": 1.311 + }, + "type": "chat" }, { - "id": "RVC-Boss/GPT-SoVITS", - "name": "RVC-Boss/GPT-SoVITS", - "display_name": "RVC-Boss/GPT-SoVITS", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 0.656, + "output": 2.731 + }, + "type": "chat" }, { - "id": "fishaudio/fish-speech-1.5", - "name": "fishaudio/fish-speech-1.5", - "display_name": "fishaudio/fish-speech-1.5", + "id": "nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super 120B A12B", + "display_name": "Nemotron 3 Super 120B A12B", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", + "cost": { + "input": 0.266, + "output": 0.799 + }, + "type": "chat" }, { - "id": "black-forest-labs/FLUX.1-pro", - "name": "black-forest-labs/FLUX.1-pro", - "display_name": "black-forest-labs/FLUX.1-pro", + "id": "nova-pro-v1", + "name": "Nova Pro 1.0", + "display_name": "Nova Pro 1.0", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 300000, + "output": 5000 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "cost": { + "input": 1.016, + "output": 4.061 + }, + "type": "chat" }, { - "id": "LoRA/black-forest-labs/FLUX.1-dev", - "name": "LoRA/black-forest-labs/FLUX.1-dev", - "display_name": "LoRA/black-forest-labs/FLUX.1-dev", + "id": "claude-4-5-sonnet", + "name": "Claude 4.5 Sonnet", + "display_name": "Claude 4.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 200000, + "output": 200000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3.259, + "output": 16.296 + }, + "type": "chat" }, { - "id": "SeedLLM/Seed-Rice-7B", - "name": "SeedLLM/Seed-Rice-7B", - "display_name": "SeedLLM/Seed-Rice-7B", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -32776,39 +34016,43 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0.062, + "output": 0.408 }, "type": "chat" - } - ] - }, - "submodel": { - "id": "submodel", - "name": "submodel", - "display_name": "submodel", - "api": "https://llm.submodel.ai/v1", - "doc": "https://submodel.gitbook.io", - "models": [ + }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -32816,50 +34060,55 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 0.3 + "input": 3.307, + "output": 16.536 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "claude-opus4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 1000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.2, - "output": 0.8 + "input": 5.98, + "output": 29.89 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -32869,40 +34118,29 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "knowledge": "2025-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.441, + "output": 1.984 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "llama-3.1-405b-instruct", + "name": "Llama 3.1 405B Instruct", + "display_name": "Llama 3.1 405B Instruct", "modalities": { "input": [ "text" @@ -32912,8 +34150,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -32922,18 +34160,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-FP8", - "name": "GLM 4.5 FP8", - "display_name": "GLM 4.5 FP8", + "id": "glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -32943,8 +34182,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 198000, + "output": 198000 }, "temperature": true, "tool_call": true, @@ -32952,20 +34191,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.45, + "output": 2.23 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "gpt-oss-120b", + "name": "GPT Oss 120b", + "display_name": "GPT Oss 120b", "modalities": { "input": [ "text" @@ -32975,29 +34226,34 @@ ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": true, + "knowledge": "2024-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "mixtral-8x7B-instruct-v0.1", + "name": "Mixtral 8x7B Instruct v0.1", + "display_name": "Mixtral 8x7B Instruct v0.1", "modalities": { "input": [ "text" @@ -33007,28 +34263,30 @@ ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.438, + "output": 0.68 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -33038,8 +34296,8 @@ ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -33059,30 +34317,31 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.5, - "output": 2.15 + "input": 1.08, + "output": 3.44 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -33092,43 +34351,43 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0.81, + "output": 3.54, + "cache_read": 0.2 }, "type": "chat" - } - ] - }, - "minimax-coding-plan": { - "id": "minimax-coding-plan", - "name": "MiniMax Coding Plan (minimax.io)", - "display_name": "MiniMax Coding Plan (minimax.io)", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/coding-plan/intro", - "models": [ + }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "claude-4-6-sonnet", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 1000000, + "output": 1000000 }, "temperature": true, "tool_call": true, @@ -33136,64 +34395,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 3.59, + "output": 17.92 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "mistral-large-2512", + "name": "Mistral Large 3 2512", + "display_name": "Mistral Large 3 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.5, + "output": 1.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -33203,8 +34453,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -33225,20 +34475,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.553, + "output": 3.106, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "qwen3.5-122b-a10b", + "name": "Qwen3.5 122B A10B", + "display_name": "Qwen3.5 122B A10B", "modalities": { "input": [ "text" @@ -33248,8 +34498,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -33270,20 +34520,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2026-01", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.444, + "output": 3.106 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text" @@ -33293,8 +34542,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 250000, + "output": 250000 }, "temperature": true, "tool_call": true, @@ -33304,23 +34553,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2026-01", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -33330,8 +34586,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -33341,66 +34597,64 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.133, + "output": 0.266, + "cache_read": 0.028 }, "type": "chat" - } - ] - }, - "perplexity": { - "id": "perplexity", - "name": "Perplexity", - "display_name": "Perplexity", - "doc": "https://docs.perplexity.ai", - "models": [ + }, { - "id": "sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 3, - "output": 15 + "input": 0.053, + "output": 0.222 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Sonar Deep Research", - "display_name": "Perplexity Sonar Deep Research", + "id": "llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -33410,31 +34664,39 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131000, + "output": 131000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-02-01", - "last_updated": "2025-09-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2, - "output": 8, - "reasoning": 3 + "input": 0.089, + "output": 0.275 }, "type": "chat" - }, + } + ] + }, + "baseten": { + "id": "baseten", + "name": "Baseten", + "display_name": "Baseten", + "api": "https://inference.baseten.co/v1", + "doc": "https://docs.baseten.co/development/model-apis/overview", + "models": [ { - "id": "sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -33444,72 +34706,61 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 164000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", "cost": { - "input": 1, - "output": 1 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 164000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 2, - "output": 8 + "input": 0.77, + "output": 0.77 }, "type": "chat" - } - ] - }, - "deepseek": { - "id": "deepseek", - "name": "DeepSeek", - "display_name": "DeepSeek", - "api": "https://api.deepseek.com", - "doc": "https://api-docs.deepseek.com/zh-cn/quick_start/pricing", - "models": [ + }, { - "id": "deepseek-chat", - "name": "DeepSeek Chat", - "display_name": "DeepSeek Chat", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -33519,30 +34770,41 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 163800, + "output": 131100 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2024-12-26", - "last_updated": "2026-04-24", + "knowledge": "2025-10", + "release_date": "2025-12-01", + "last_updated": "2026-03-06", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.3, + "output": 0.45 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -33552,10 +34814,10 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -33564,50 +34826,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Compatibility alias for deepseek-v4-flash thinking mode." ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-01-20", - "last_updated": "2026-04-24", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2026-03-06", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -33618,39 +34872,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." ] } }, "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text" @@ -33660,8 +34905,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -33672,48 +34917,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." ] } }, "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-12", + "release_date": "2026-01-30", + "last_updated": "2026-02-12", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.6, + "output": 3 }, "type": "chat" - } - ] - }, - "llama": { - "id": "llama", - "name": "Llama", - "display_name": "Llama", - "api": "https://api.llama.com/compat/v1/", - "doc": "https://llama.developer.meta.com/docs/models", - "models": [ + }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct 0905", + "display_name": "Kimi K2 Instruct 0905", "modalities": { "input": [ "text" @@ -33723,30 +34949,30 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-08", + "release_date": "2025-09-05", + "last_updated": "2026-03-06", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "cerebras-llama-4-maverick-17b-128e-instruct", - "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "modalities": { + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", + "modalities": { "input": [ "text" ], @@ -33756,28 +34982,34 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "llama-3.3-8b-instruct", - "name": "Llama-3.3-8B-Instruct", - "display_name": "Llama-3.3-8B-Instruct", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -33787,29 +35019,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "cerebras-llama-4-scout-17b-16e-instruct", - "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", - "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -33819,29 +35063,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2026-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0 + "input": 0.95, + "output": 3.15 }, "type": "chat" }, { - "id": "groq-llama-4-maverick-17b-128e-instruct", - "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "id": "zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -33851,104 +35107,122 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-08-31", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct-fp8", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "nvidia/Nemotron-120B-A12B", + "name": "Nemotron 3 Super", + "display_name": "Nemotron 3 Super", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 32678 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.75 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204000, + "output": 204000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2026-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2 }, "type": "chat" - } - ] - }, - "fireworks-ai": { - "id": "fireworks-ai", - "name": "Fireworks AI", - "display_name": "Fireworks AI", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://fireworks.ai/docs/", - "models": [ + }, { - "id": "accounts/fireworks/models/glm-5p1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -33958,8 +35232,8 @@ ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -33980,19 +35254,62 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 1.74, + "output": 3.48, + "cache_read": 0.15 + }, + "type": "chat" + } + ] + }, + "llama": { + "id": "llama", + "name": "Llama", + "display_name": "Llama", + "api": "https://api.llama.com/compat/v1/", + "doc": "https://llama.developer.meta.com/docs/models", + "models": [ + { + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/deepseek-v3p2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "cerebras-llama-4-scout-17b-16e-instruct", + "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ "text" @@ -34002,42 +35319,29 @@ ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.28 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/minimax-m2p5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "llama-3.3-8b-instruct", + "name": "Llama-3.3-8B-Instruct", + "display_name": "Llama-3.3-8B-Instruct", "modalities": { "input": [ "text" @@ -34047,41 +35351,62 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0, + "output": 0 }, - "attachment": false, + "type": "chat" + }, + { + "id": "llama-4-scout-17b-16e-instruct-fp8", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-4p5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "cerebras-llama-4-maverick-17b-128e-instruct", + "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ "text" @@ -34091,30 +35416,29 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -34124,41 +35448,29 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "accounts/fireworks/models/deepseek-v3p1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "groq-llama-4-maverick-17b-128e-instruct", + "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ "text" @@ -34168,42 +35480,51 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "novita-ai": { + "id": "novita-ai", + "name": "NovitaAI", + "display_name": "NovitaAI", + "api": "https://api.novita.ai/openai", + "doc": "https://novita.ai/docs/guides/introduction", + "models": [ { - "id": "accounts/fireworks/models/kimi-k2p6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -34222,21 +35543,22 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "accounts/fireworks/models/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -34246,8 +35568,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -34257,52 +35579,49 @@ "attachment": false, "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 1, - "output": 3 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "accounts/fireworks/models/qwen3p6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-04", - "last_updated": "2026-04-04", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.1 + "input": 0.57, + "output": 2.3 }, "type": "chat" }, { - "id": "accounts/fireworks/models/minimax-m2p1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -34312,8 +35631,8 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -34334,74 +35653,68 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "accounts/fireworks/models/minimax-m2p7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: GPT OSS 20B", + "display_name": "OpenAI: GPT OSS 20B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-12", - "last_updated": "2026-04-12", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.04, + "output": 0.15 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-4p7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 198000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -34411,31 +35724,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.3 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-4p5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "zai-org/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -34445,7 +35750,7 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, @@ -34467,32 +35772,65 @@ }, "attachment": false, "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 98304 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-10-13", + "last_updated": "2025-10-13", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0.13, + "output": 0.85 }, "type": "chat" }, { - "id": "accounts/fireworks/models/kimi-k2p5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "zai-org/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", - "image", - "video" + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -34500,33 +35838,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { "input": 0.6, - "output": 3, - "cache_read": 0.1 + "output": 1.8, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "accounts/fireworks/models/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "zai-org/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -34536,8 +35863,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -34552,18 +35879,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "accounts/fireworks/models/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "zai-org/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -34573,8 +35902,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -34584,23 +35913,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.55, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "accounts/fireworks/models/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -34610,8 +35946,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -34632,19 +35968,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0.6, - "output": 2.5, - "cache_read": 0.3 + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "accounts/fireworks/routers/kimi-k2p5-turbo", - "name": "Kimi K2.5 Turbo", - "display_name": "Kimi K2.5 Turbo", + "id": "zai-org/autoglm-phone-9b-multilingual", + "name": "AutoGLM-Phone-9B-Multilingual", + "display_name": "AutoGLM-Phone-9B-Multilingual", "modalities": { "input": [ "text", @@ -34655,8 +35991,39 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 65536, + "output": 65536 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-10", + "last_updated": "2025-12-10", + "cost": { + "input": 0.035, + "output": 0.138 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -34677,20 +36044,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "accounts/fireworks/models/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "zai-org/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -34700,8 +36066,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 202800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -34722,41 +36088,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-02-11", + "last_updated": "2026-02-12", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.15 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" - } - ] - }, - "kimi-for-coding": { - "id": "kimi-for-coding", - "name": "Kimi For Coding", - "display_name": "Kimi For Coding", - "api": "https://api.kimi.com/coding/v1", - "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", - "models": [ + }, { - "id": "k2p6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "zai-org/glm-4.6v", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ "text", - "image", - "video" + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 131072, "output": 32768 }, "temperature": true, @@ -34765,60 +36121,54 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04", - "last_updated": "2026-04", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 0.9, + "cache_read": 0.055 }, "type": "chat" }, { - "id": "k2p5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "baichuan/baichuan-m2-32b", + "name": "baichuan-m2-32b", + "display_name": "baichuan-m2-32b", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2024-12", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.07, + "output": 0.07 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "minimax/minimax-m2.1", + "name": "Minimax M2.1", + "display_name": "Minimax M2.1", "modalities": { "input": [ "text" @@ -34828,14 +36178,13 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -34850,30 +36199,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11", - "last_updated": "2025-12", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" - } - ] - }, - "moark": { - "id": "moark", - "name": "Moark", - "display_name": "Moark", - "api": "https://moark.com/v1", - "doc": "https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", - "models": [ + }, { - "id": "GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "minimax/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -34905,19 +36243,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 3.5, - "output": 14 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -34928,7 +36266,7 @@ }, "limit": { "context": 204800, - "output": 131072 + "output": 131100 }, "temperature": true, "tool_call": true, @@ -34938,30 +36276,28 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2.1, - "output": 8.4 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" - } - ] - }, - "opencode-go": { - "id": "opencode-go", - "name": "OpenCode Go", - "display_name": "OpenCode Go", - "api": "https://opencode.ai/zen/go/v1", - "doc": "https://opencode.ai/docs/zen", - "models": [ + }, { - "id": "minimax-m2.7", + "id": "minimax/minimax-m2.7", "name": "MiniMax M2.7", "display_name": "MiniMax M2.7", "modalities": { @@ -34995,7 +36331,6 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", "release_date": "2026-03-18", "last_updated": "2026-03-18", "cost": { @@ -35006,22 +36341,20 @@ "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax M2.5 Highspeed", + "display_name": "MiniMax M2.5 Highspeed", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131100 }, "temperature": true, "tool_call": true, @@ -35040,22 +36373,21 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { "input": 0.6, - "output": 3, - "cache_read": 0.1 + "output": 2.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo V2.5 Pro", - "display_name": "MiMo V2.5 Pro", + "id": "kwaipilot/kat-coder-pro", + "name": "Kat Coder Pro", + "display_name": "Kat Coder Pro", "modalities": { "input": [ "text" @@ -35065,47 +36397,29 @@ ] }, "limit": { - "context": 1048576, + "context": 256000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-01-05", + "last_updated": "2026-01-05", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "nousresearch/hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ "text" @@ -35115,191 +36429,121 @@ ] }, "limit": { - "context": 202752, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo V2 Omni", - "display_name": "MiMo V2 Omni", + "id": "sao10K/l3-8b-lunaris", + "name": "Sao10k L3 8B Lunaris\t", + "display_name": "Sao10k L3 8B Lunaris\t", "modalities": { "input": [ - "text", - "image", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-11-28", + "last_updated": "2024-11-28", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo V2.5", - "display_name": "MiMo V2.5", + "id": "sao10K/l31-70b-euryale-v2.2", + "name": "L31 70B Euryale V2.2", + "display_name": "L31 70B Euryale V2.2", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "sao10K/L3-8B-stheno-v3.2", + "name": "L3 8B Stheno V3.2", + "display_name": "L3 8B Stheno V3.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "sao10K/l3-70b-euryale-v2.1", + "name": "L3 70B Euryale V2.1\t", + "display_name": "L3 70B Euryale V2.1\t", "modalities": { "input": [ "text" @@ -35309,92 +36553,63 @@ ] }, "limit": { - "context": 202752, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "release_date": "2024-06-18", + "last_updated": "2024-06-18", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "paddlepaddle/paddleocr-vl", + "name": "PaddleOCR-VL", + "display_name": "PaddleOCR-VL", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-10-22", + "last_updated": "2025-10-22", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "inclusionai/ling-2.6-1t", + "name": "Ling-2.6-1T", + "display_name": "Ling-2.6-1T", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -35402,41 +36617,27 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "inclusionai/ling-2.6-flash", + "name": "Ling-2.6-flash", + "display_name": "Ling-2.6-flash", "modalities": { "input": [ "text" @@ -35446,42 +36647,29 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", "release_date": "2026-04-24", "last_updated": "2026-04-24", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.0145 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "mistralai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -35491,92 +36679,61 @@ ] }, "limit": { - "context": 204800, - "output": 65536 + "context": 60288, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2024-07-30", + "last_updated": "2024-07-30", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.04, + "output": 0.17 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo V2 Pro", - "display_name": "MiMo V2 Pro", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B Instruct", + "display_name": "Qwen2.5 VL 72B Instruct", "modalities": { "input": [ "text", @@ -35588,52 +36745,28 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "open_weights": true, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.2, - "output": 1.2, - "cache_read": 0.02, - "cache_write": 0.25 + "input": 0.8, + "output": 0.8 }, "type": "chat" - } - ] - }, - "databricks": { - "id": "databricks", - "name": "Databricks", - "display_name": "Databricks", - "api": "https://${DATABRICKS_HOST}/ai-gateway/mlflow/v1", - "doc": "https://docs.databricks.com/aws/en/machine-learning/foundation-models/", - "models": [ + }, { - "id": "databricks-gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen/qwen2.5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -35643,32 +36776,33 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.072, - "output": 0.28 + "input": 0.07, + "output": 0.07 }, "type": "chat" }, { - "id": "databricks-gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -35679,140 +36813,113 @@ "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0.98, + "output": 3.95 }, "type": "chat" }, { - "id": "databricks-claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-10-15", + "last_updated": "2024-10-15", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.38, + "output": 0.4 }, "type": "chat" }, { - "id": "databricks-claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 40960, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.09, + "output": 0.45 }, "type": "chat" }, { - "id": "databricks-gemini-3-pro", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5-122B-A10B", + "display_name": "Qwen3.5-122B-A10B", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -35820,214 +36927,193 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.4, + "output": 3.2 }, "type": "chat" }, { - "id": "databricks-gemini-3-1-pro", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "qwen/qwen3-omni-30b-a3b-instruct", + "name": "Qwen3 Omni 30B A3B Instruct", + "display_name": "Qwen3 Omni 30B A3B Instruct", "modalities": { "input": [ "text", - "image", "video", "audio", - "pdf" + "image" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.25, + "output": 0.97, + "input_audio": 2.2, + "output_audio": 1.788 }, "type": "chat" }, { - "id": "databricks-gpt-5-4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "qwen/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 2.11, + "output": 8.45 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "databricks-gemini-2-5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "qwen/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "databricks-gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "qwen/qwen3-omni-30b-a3b-thinking", + "name": "Qwen3 Omni 30B A3B Thinking", + "display_name": "Qwen3 Omni 30B A3B Thinking", "modalities": { "input": [ "text", + "audio", + "video", "image" ], "output": [ @@ -36035,273 +37121,236 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.25, + "output": 0.97, + "input_audio": 2.2, + "output_audio": 1.788 }, "type": "chat" }, { - "id": "databricks-gpt-5-4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", - "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", + "cost": { + "input": 0.15, + "output": 1.5 + }, "type": "chat" }, { - "id": "databricks-gemini-3-1-flash-lite", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "qwen/qwen3-4b-fp8", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "databricks-gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "qwen/qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 40960, + "output": 20000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "qwen/qwen-mt-plus", + "name": "Qwen MT Plus", + "display_name": "Qwen MT Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - }, - { - "id": "databricks-gpt-5-2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-03", + "last_updated": "2025-09-03", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.25, + "output": 0.75 }, "type": "chat" }, { - "id": "databricks-gpt-5-5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "qwen/qwen3-vl-30b-a3b-thinking", + "display_name": "qwen/qwen3-vl-30b-a3b-thinking", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "open_weights": true, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.2, + "output": 1 }, "type": "chat" }, { - "id": "databricks-gemini-3-flash", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5-35B-A3B", + "display_name": "Qwen3.5-35B-A3B", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -36310,319 +37359,279 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "qwen/qwen3-32b-fp8", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 40960, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0.45 }, "type": "chat" }, { - "id": "databricks-gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "qwen/qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.09, + "output": 0.58 }, "type": "chat" }, { - "id": "databricks-claude-sonnet-4", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 1.3 }, "type": "chat" }, { - "id": "databricks-gpt-5-1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "qwen/qwen3-vl-8b-instruct", + "display_name": "qwen/qwen3-vl-8b-instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2025-10-17", + "last_updated": "2025-10-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.08, + "output": 0.5 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22b Thinking 2507", + "display_name": "Qwen3 235B A22b Thinking 2507", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 3 }, "type": "chat" }, { - "id": "databricks-gemini-2-5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30b A3B Instruct", + "display_name": "Qwen3 Coder 30b A3B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 160000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.07, + "output": 0.27 }, "type": "chat" }, { - "id": "databricks-gpt-5-4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "databricks-claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5-27B", + "display_name": "Qwen3.5-27B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -36630,66 +37639,64 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 2.4 }, "type": "chat" - } - ] - }, - "io-net": { - "id": "io-net", - "name": "IO.NET", - "display_name": "IO.NET", - "api": "https://api.intelligence.io.solutions/api/v1", - "doc": "https://io.net/docs/guides/intelligence/io-intelligence", - "models": [ + }, { - "id": "Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "qwen/qwen3-vl-30b-a3b-instruct", + "display_name": "qwen/qwen3-vl-30b-a3b-instruct", "modalities": { "input": [ - "text" + "text", + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 106000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "cost": { - "input": 0.22, - "output": 0.95, - "cache_read": 0.11, - "cache_write": 0.44 + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen 3 Next 80B Instruct", - "display_name": "Qwen 3 Next 80B Instruct", + "id": "qwen/qwen3-8b-fp8", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ "text" @@ -36699,34 +37706,33 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 128000, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-10", - "last_updated": "2025-01-10", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.1, - "output": 0.8, - "cache_read": 0.05, - "cache_write": 0.2 + "input": 0.035, + "output": 0.138 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen 3 235B Thinking", - "display_name": "Qwen 3 235B Thinking", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B", + "display_name": "Gemma 4 26B A4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -36734,7 +37740,7 @@ }, "limit": { "context": 262144, - "output": 4096 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -36742,34 +37748,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.11, - "output": 0.6, - "cache_read": 0.055, - "cache_write": 0.22 + "input": 0.13, + "output": 0.4 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen 2.5 VL 32B Instruct", - "display_name": "Qwen 2.5 VL 32B Instruct", + "id": "google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ "text", @@ -36780,139 +37772,124 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 98304, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0.025, - "cache_write": 0.1 + "input": 0.119, + "output": 0.2 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-15", - "last_updated": "2024-11-15", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.4, - "output": 1.75, - "cache_read": 0.2, - "cache_write": 0.8 + "input": 0.14, + "output": 0.4 }, "type": "chat" }, { - "id": "mistralai/Magistral-Small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "google/gemma-3-12b-it", + "name": "Gemma 3 12B", + "display_name": "Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0.25, - "cache_write": 1 + "input": 0.05, + "output": 0.1 }, "type": "chat" }, { - "id": "mistralai/Mistral-Large-Instruct-2411", - "name": "Mistral Large Instruct 2411", - "display_name": "Mistral Large Instruct 2411", + "id": "microsoft/wizardlm-2-8x22b", + "name": "Wizardlm 2 8x22B", + "display_name": "Wizardlm 2 8x22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65535, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "release_date": "2024-04-24", + "last_updated": "2024-04-24", "cost": { - "input": 2, - "output": 6, - "cache_read": 1, - "cache_write": 4 + "input": 0.62, + "output": 0.62 }, "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "gryphe/mythomax-l2-13b", + "name": "Mythomax L2 13B", + "display_name": "Mythomax L2 13B", "modalities": { "input": [ "text" @@ -36922,31 +37899,28 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 4096, + "output": 3200 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-05", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.02, - "output": 0.04, - "cache_read": 0.01, - "cache_write": 0.04 + "input": 0.09, + "output": 0.09 }, "type": "chat" }, { - "id": "mistralai/Devstral-Small-2505", - "name": "Devstral Small 2505", - "display_name": "Devstral Small 2505", + "id": "deepseek/deepseek-r1-0528-qwen3-8b", + "name": "DeepSeek R1 0528 Qwen3 8B", + "display_name": "DeepSeek R1 0528 Qwen3 8B", "modalities": { "input": [ "text" @@ -36957,30 +37931,28 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "open_weights": true, + "release_date": "2025-05-29", + "last_updated": "2025-05-29", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0.025, - "cache_write": 0.1 + "input": 0.06, + "output": 0.09 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "deepseek/deepseek-prover-v2-671b", + "name": "Deepseek Prover V2 671B", + "display_name": "Deepseek Prover V2 671B", "modalities": { "input": [ "text" @@ -36990,66 +37962,60 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 160000, + "output": 160000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-04-30", + "last_updated": "2025-04-30", "cost": { - "input": 0.13, - "output": 0.38, - "cache_read": 0.065, - "cache_write": 0.26 + "input": 0.7, + "output": 2.5 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "id": "deepseek/deepseek-r1-turbo", + "name": "DeepSeek R1 (Turbo)\t", + "display_name": "DeepSeek R1 (Turbo)\t", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 430000, - "output": 4096 + "context": 64000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075, - "cache_write": 0.3 + "input": 0.7, + "output": 2.5 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", - "name": "Llama 3.2 90B Vision Instruct", - "display_name": "Llama 3.2 90B Vision Instruct", + "id": "deepseek/deepseek-ocr-2", + "name": "deepseek/deepseek-ocr-2", + "display_name": "deepseek/deepseek-ocr-2", "modalities": { "input": [ "text", @@ -37060,31 +38026,27 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.35, - "output": 0.4, - "cache_read": 0.175, - "cache_write": 0.7 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "deepseek/deepseek-v3.2-exp", + "name": "Deepseek V3.2 Exp", + "display_name": "Deepseek V3.2 Exp", "modalities": { "input": [ "text" @@ -37094,8 +38056,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37103,34 +38065,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-28", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2, - "output": 8.75, - "cache_read": 1, - "cache_write": 4 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT-OSS 20B", - "display_name": "GPT-OSS 20B", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -37140,36 +38088,42 @@ ] }, "limit": { - "context": 64000, - "output": 4096 + "context": 163840, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.03, - "output": 0.14, - "cache_read": 0.015, - "cache_write": 0.06 + "input": 0.7, + "output": 2.5, + "cache_read": 0.35 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -37179,36 +38133,30 @@ ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-07", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.04, - "output": 0.4, - "cache_read": 0.02, - "cache_write": 0.08 + "input": 0.27, + "output": 1.12, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "deepseek/deepseek-v3.2", + "name": "Deepseek V3.2", + "display_name": "Deepseek V3.2", "modalities": { "input": [ "text" @@ -37218,8 +38166,8 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37239,65 +38187,52 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.55, - "output": 2.25, - "cache_read": 0.275, - "cache_write": 1.1 + "input": 0.269, + "output": 0.4, + "cache_read": 0.1345 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "deepseek/deepseek-ocr", + "name": "DeepSeek-OCR", + "display_name": "DeepSeek-OCR", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-09-05", - "last_updated": "2024-09-05", + "attachment": true, + "open_weights": true, + "release_date": "2025-10-24", + "last_updated": "2025-10-24", "cost": { - "input": 0.39, - "output": 1.9, - "cache_read": 0.195, - "cache_write": 0.78 + "input": 0.03, + "output": 0.03 }, "type": "chat" - } - ] - }, - "alibaba-cn": { - "id": "alibaba-cn", - "name": "alibaba-cn", - "display_name": "alibaba-cn", - "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "models": [ + }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "deepseek/deepseek-v3-turbo", + "name": "DeepSeek V3 (Turbo)\t", + "display_name": "DeepSeek V3 (Turbo)\t", "modalities": { "input": [ "text" @@ -37307,47 +38242,28 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 64000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.287, - "output": 1.147, - "reasoning": 2.868 + "input": 0.4, + "output": 1.3 }, "type": "chat" }, { - "id": "qwen-plus-character", - "name": "Qwen Plus Character", - "display_name": "Qwen Plus Character", + "id": "deepseek/deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "display_name": "DeepSeek R1 Distill Qwen 14B", "modalities": { "input": [ "text" @@ -37358,28 +38274,27 @@ }, "limit": { "context": 32768, - "output": 4096 + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.115, - "output": 0.287 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "qwen2-5-math-7b-instruct", - "name": "Qwen2.5-Math 7B Instruct", - "display_name": "Qwen2.5-Math 7B Instruct", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -37389,75 +38304,67 @@ ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.144, - "output": 0.287 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Moonshot Kimi K2.5", - "display_name": "Moonshot Kimi K2.5", + "id": "deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill LLama 70B", + "display_name": "DeepSeek R1 Distill LLama 70B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.574, - "output": 2.411 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "qwen-doc-turbo", - "name": "Qwen Doc Turbo", - "display_name": "Qwen Doc Turbo", + "id": "deepseek/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -37467,196 +38374,157 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 64000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.087, - "output": 0.144 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen-vl-ocr", - "name": "Qwen Vl Ocr", - "display_name": "Qwen Vl Ocr", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "Deepseek V3.1 Terminus", + "display_name": "Deepseek V3.1 Terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-28", - "last_updated": "2025-04-13", + "open_weights": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.717, - "output": 0.717 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "qwen-omni-turbo-realtime", - "name": "Qwen-Omni Turbo Realtime", - "display_name": "Qwen-Omni Turbo Realtime", + "id": "minimaxai/minimax-m1-80k", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 1000000, + "output": 40000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "open_weights": true, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.23, - "output": 0.918, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "qwen3-8b", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick Instruct", + "display_name": "Llama 4 Maverick Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1048576, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-04-06", + "last_updated": "2025-04-06", "cost": { - "input": 0.072, - "output": 0.287, - "reasoning": 0.717 + "input": 0.27, + "output": 0.85 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout Instruct", + "display_name": "Llama 4 Scout Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2025-04-06", + "last_updated": "2025-04-06", "cost": { - "input": 0.43, - "output": 2.58, - "reasoning": 2.58 + "input": 0.18, + "output": 0.59 }, "type": "chat" }, { - "id": "qwen-math-turbo", - "name": "Qwen Math Turbo", - "display_name": "Qwen Math Turbo", + "id": "meta-llama/llama-3-70b-instruct", + "name": "Llama3 70B Instruct", + "display_name": "Llama3 70B Instruct", "modalities": { "input": [ "text" @@ -37666,29 +38534,28 @@ ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 8192, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.51, + "output": 0.74 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "meta-llama/llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -37698,56 +38565,31 @@ ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.23, - "output": 0.574 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -37755,7 +38597,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 120000 }, "temperature": true, "tool_call": true, @@ -37763,20 +38605,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-07", + "last_updated": "2024-12-07", "cost": { - "input": 0.115, - "output": 0.287 + "input": 0.135, + "output": 0.4 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -37786,40 +38628,28 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 32768, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.86, - "output": 3.15 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -37829,34 +38659,28 @@ ] }, "limit": { - "context": 32768, + "context": 16384, "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.02, + "output": 0.05 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "xiaomimimo/mimo-v2-flash", + "name": "XiaomiMiMo/MiMo-V2-Flash", + "display_name": "XiaomiMiMo/MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -37866,58 +38690,44 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-12", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 0.287, - "output": 1.147, - "reasoning": 2.868 + "input": 0.1, + "output": 0.3, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "baidu/ernie-4.5-vl-28b-a3b-thinking", + "name": "ERNIE-4.5-VL-28B-A3B-Thinking", + "display_name": "ERNIE-4.5-VL-28B-A3B-Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37925,69 +38735,53 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.39, + "output": 0.39 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "ERNIE 4.5 VL 424B A47B", + "display_name": "ERNIE 4.5 VL 424B A47B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 123000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "attachment": true, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.345, - "output": 1.377 + "input": 0.42, + "output": 1.25 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "baidu/ernie-4.5-21B-a3b-thinking", + "name": "ERNIE-4.5-21B-A3B-Thinking", + "display_name": "ERNIE-4.5-21B-A3B-Thinking", "modalities": { "input": [ "text" @@ -37997,68 +38791,41 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.115, - "output": 0.287, - "reasoning": 1.147 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "baidu/ernie-4.5-21B-a3b", + "name": "ERNIE 4.5 21B A3B", + "display_name": "ERNIE 4.5 21B A3B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 120000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -38066,22 +38833,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.058, - "output": 0.23, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "baidu/ernie-4.5-300b-a47b-paddle", + "name": "ERNIE 4.5 300B A47B", + "display_name": "ERNIE 4.5 300B A47B", "modalities": { "input": [ "text" @@ -38091,52 +38856,28 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 123000, + "output": 12000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.022, - "output": 0.216 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "qwen2-5-vl-7b-instruct", - "name": "Qwen2.5-VL 7B Instruct", - "display_name": "Qwen2.5-VL 7B Instruct", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "ERNIE 4.5 VL 28B A3B", + "display_name": "ERNIE 4.5 VL 28B A3B", "modalities": { "input": [ "text", @@ -38147,40 +38888,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 30000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.287, - "output": 0.717 + "input": 1.4, + "output": 5.6 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -38199,33 +38942,33 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.574, - "output": 2.294 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen3.5-flash", - "name": "Qwen3.5 Flash", - "display_name": "Qwen3.5 Flash", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -38244,35 +38987,33 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.172, - "output": 1.72, - "reasoning": 1.72 + "input": 1.69, + "output": 3.38, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -38292,65 +39033,82 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.276, - "output": 1.651, - "cache_read": 0.028, - "cache_write": 0.344 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "digitalocean": { + "id": "digitalocean", + "name": "DigitalOcean", + "display_name": "DigitalOcean", + "api": "https://inference.do-ai.run/v1", + "doc": "https://docs.digitalocean.com/products/gradient-ai-platform/details/models/", + "models": [ { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "openai-gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-30", "cost": { - "input": 0.861, - "output": 3.441 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "openai-o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -38360,168 +39118,146 @@ ] }, "limit": { - "context": 202752, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-14", - "last_updated": "2026-04-14", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.87, - "output": 3.48, - "cache_read": 0.17 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "qwen3-omni-flash", - "name": "Qwen3-Omni Flash", - "display_name": "Qwen3-Omni Flash", + "id": "bge-reranker-v2-m3", + "name": "BGE Reranker v2 M3", + "display_name": "BGE Reranker v2 M3", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 8192, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "release_date": "2024-03-12", + "last_updated": "2026-04-30", "cost": { - "input": 0.058, - "output": 0.23, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "rerank" }, { - "id": "deepseek-v3-1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "openai-gpt-5-mini", + "name": "GPT-5 mini", + "display_name": "GPT-5 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.574, - "output": 1.721 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen2-5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "openai-o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.574, - "output": 1.721 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3-VL 235B-A22B", - "display_name": "Qwen3-VL 235B-A22B", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 262144, "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -38540,197 +39276,191 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-04-16", "cost": { - "input": 0.286705, - "output": 1.14682, - "reasoning": 2.867051 + "input": 0.5, + "output": 2.7 }, "type": "chat" }, { - "id": "qwen-math-plus", - "name": "Qwen Math Plus", - "display_name": "Qwen Math Plus", + "id": "anthropic-claude-4.5-haiku", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-08-16", - "last_updated": "2024-09-19", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.574, - "output": 1.721 + "input": 1, + "output": 5, + "cache_read": 1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen2-5-coder-32b-instruct", - "name": "Qwen2.5-Coder 32B Instruct", - "display_name": "Qwen2.5-Coder 32B Instruct", + "id": "openai-gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-11", - "last_updated": "2024-11", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen3-asr-flash", - "name": "Qwen3-ASR Flash", - "display_name": "Qwen3-ASR Flash", + "id": "llama3.3-70b-instruct", + "name": "Llama 3.3 Instruct 70B", + "display_name": "Llama 3.3 Instruct 70B", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.032, - "output": 0.032 + "input": 0.65, + "output": 0.65 }, "type": "chat" }, { - "id": "qwen-deep-research", - "name": "Qwen Deep Research", - "display_name": "Qwen Deep Research", + "id": "nemotron-3-nano-omni", + "name": "Nemotron Nano 3 Omni", + "display_name": "Nemotron Nano 3 Omni", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-28", + "last_updated": "2026-04-30", "cost": { - "input": 7.742, - "output": 23.367 + "input": 0.5, + "output": 0.9 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "nemotron-nano-12b-v2-vl", + "name": "Nemotron Nano 12B v2 VL", + "display_name": "Nemotron Nano 12B v2 VL", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "knowledge": "2024-10", + "release_date": "2025-12-01", + "last_updated": "2026-04-30", "cost": { - "input": 0.144, - "output": 1.434 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen-mt-plus", - "name": "Qwen Mt Plus", - "display_name": "Qwen Mt Plus", + "id": "mistral-7b-instruct-v0.3", + "name": "Mistral 7B Instruct v0.3", + "display_name": "Mistral 7B Instruct v0.3", "modalities": { "input": [ "text" @@ -38740,29 +39470,24 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", - "cost": { - "input": 0.259, - "output": 0.775 - }, + "open_weights": true, + "release_date": "2024-05-22", + "last_updated": "2024-05-22", "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-32b", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill Qwen 32B", + "id": "nemotron-3-nano-30b", + "name": "Nemotron 3 Nano 30B A3B", + "display_name": "Nemotron 3 Nano 30B A3B", "modalities": { "input": [ "text" @@ -38772,8 +39497,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -38782,52 +39507,52 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.287, - "output": 0.861 - }, + "open_weights": true, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "anthropic-claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.23, - "output": 0.574 + "input": 1, + "output": 5, + "cache_read": 1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "all-mini-lm-l6-v2", + "name": "All-MiniLM-L6-v2", + "display_name": "All-MiniLM-L6-v2", "modalities": { "input": [ "text" @@ -38837,157 +39562,178 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 256, + "output": 384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "release_date": "2021-08-30", + "last_updated": "2026-04-16", "cost": { - "input": 0.144, - "output": 0.574 + "input": 0.009, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-7b", - "name": "DeepSeek R1 Distill Qwen 7B", - "display_name": "DeepSeek R1 Distill Qwen 7B", + "id": "openai-gpt-image-1", + "name": "GPT Image 1", + "display_name": "GPT Image 1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-04-24", + "last_updated": "2025-04-24", "cost": { - "input": 0.072, - "output": 0.144 + "input": 5, + "output": 40, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen2-5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "qwen3-tts-voicedesign", + "name": "Qwen3 TTS VoiceDesign", + "display_name": "Qwen3 TTS VoiceDesign", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", - "cost": { - "input": 0.072, - "output": 0.144 - }, + "release_date": "2026-04-21", + "last_updated": "2026-04-30", "type": "chat" }, { - "id": "qwen2-5-14b-instruct", - "name": "Qwen2.5 14B Instruct", - "display_name": "Qwen2.5 14B Instruct", + "id": "openai-gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.144, - "output": 0.431 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "tongyi-intent-detect-v3", - "name": "Tongyi Intent Detect V3", - "display_name": "Tongyi Intent Detect V3", + "id": "anthropic-claude-4.5-sonnet", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.058, - "output": 0.144 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 + } }, "type": "chat" }, { - "id": "qwq-32b", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -38997,8 +39743,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -39019,127 +39765,136 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.287, - "output": 0.861 + "input": 1.74, + "output": 3.48 }, "type": "chat" }, { - "id": "moonshot-kimi-k2-instruct", - "name": "Moonshot Kimi K2 Instruct", - "display_name": "Moonshot Kimi K2 Instruct", + "id": "anthropic-claude-4.1-opus", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.574, - "output": 2.294 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen2-5-32b-instruct", - "name": "Qwen2.5 32B Instruct", - "display_name": "Qwen2.5 32B Instruct", + "id": "openai-gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.287, - "output": 0.861 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "openai-gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.144, - "output": 0.574 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen3-omni-flash-realtime", - "name": "Qwen3-Omni Flash Realtime", - "display_name": "Qwen3-Omni Flash Realtime", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral Nemo Instruct", + "display_name": "Mistral Nemo Instruct", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, + "context": 128000, "output": 16384 }, "temperature": true, @@ -39148,35 +39903,30 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.23, - "output": 0.918, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Moonshot Kimi K2.6", - "display_name": "Moonshot Kimi K2.6", + "id": "nvidia-nemotron-3-super-120b", + "name": "Nemotron-3-Super-120B", + "display_name": "Nemotron-3-Super-120B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -39184,44 +39934,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-04-16", "cost": { - "input": 0.929, - "output": 3.858 + "input": 0.3, + "output": 0.65 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b", - "name": "Qwen3-VL 30B-A3B", - "display_name": "Qwen3-VL 30B-A3B", + "id": "arcee-trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -39229,33 +39967,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-16", "cost": { - "input": 0.108, - "output": 0.431, - "reasoning": 1.076 + "input": 0.25, + "output": 0.9, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3 VL Plus", - "display_name": "Qwen3 VL Plus", + "id": "anthropic-claude-3.5-sonnet", + "name": "Claude 3.5 Sonnet", + "display_name": "Claude 3.5 Sonnet", "modalities": { "input": [ "text", @@ -39266,142 +39992,136 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-10-22", "cost": { - "input": 0.143353, - "output": 1.433525, - "reasoning": 4.300576 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "deepseek-v3-2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "openai-gpt-5.2-pro", + "name": "GPT-5.2 pro", + "display_name": "GPT-5.2 pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.287, - "output": 0.431 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "openai-gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.861, - "output": 3.441 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-1-5b", - "name": "DeepSeek R1 Distill Qwen 1.5B", - "display_name": "DeepSeek R1 Distill Qwen 1.5B", + "id": "openai-gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -39411,8 +40131,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 163840, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -39421,19 +40141,15 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", - "cost": { - "input": 0.216, - "output": 0.861 - }, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-03-24", "type": "chat" }, { - "id": "qwen2-5-coder-7b-instruct", - "name": "Qwen2.5-Coder 7B Instruct", - "display_name": "Qwen2.5-Coder 7B Instruct", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -39443,29 +40159,35 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-11", - "last_updated": "2024-11", + "knowledge": "2025-08", + "release_date": "2026-02-12", + "last_updated": "2026-04-16", "cost": { - "input": 0.144, - "output": 0.287 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "qwen3.5-397b-a17b", + "name": "Qwen 3.5 397B A17B", + "display_name": "Qwen 3.5 397B A17B", "modalities": { "input": [ "text" @@ -39475,19 +40197,14 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -39500,92 +40217,107 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-07-15", + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-04-30", "cost": { - "input": 0.044, - "output": 0.087, - "reasoning": 0.431 + "input": 0.55, + "output": 3.5 }, "type": "chat" }, { - "id": "qwen-mt-turbo", - "name": "Qwen Mt Turbo", - "display_name": "Qwen Mt Turbo", + "id": "ministral-3-8b-instruct-2512", + "name": "Ministral 3 8B", + "display_name": "Ministral 3 8B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-15", + "last_updated": "2025-12-15", + "type": "chat" + }, + { + "id": "openai-gpt-image-2", + "name": "GPT Image 2", + "display_name": "GPT Image 2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", - "cost": { - "input": 0.101, - "output": 0.28 - }, + "release_date": "2025-04-24", + "last_updated": "2025-04-24", "type": "chat" }, { - "id": "qwen2-5-math-72b-instruct", - "name": "Qwen2.5-Math 72B Instruct", - "display_name": "Qwen2.5-Math 72B Instruct", + "id": "stable-diffusion-3.5-large", + "name": "Stable Diffusion 3.5 Large", + "display_name": "Stable Diffusion 3.5 Large", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 256, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2024-10-22", + "last_updated": "2026-04-30", "cost": { - "input": 0.574, - "output": 1.721 + "input": 0.08, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ "text" @@ -39595,125 +40327,98 @@ ] }, "limit": { - "context": 245800, - "output": 65536 + "context": 8000, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-21", + "open_weights": true, + "release_date": "2025-06-03", + "last_updated": "2026-04-16", "cost": { - "input": 1.32, - "output": 7.9, - "cache_read": 0.132 + "input": 0.04, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen2-5-omni-7b", - "name": "Qwen2.5-Omni 7B", - "display_name": "Qwen2.5-Omni 7B", + "id": "openai-gpt-5-nano", + "name": "GPT-5 nano", + "display_name": "GPT-5 nano", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.087, - "output": 0.345, - "input_audio": 5.448 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "openai-gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.573, - "output": 3.44, - "reasoning": 3.44 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-14b", - "name": "DeepSeek R1 Distill Qwen 14B", - "display_name": "DeepSeek R1 Distill Qwen 14B", + "id": "deepseek-3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -39723,8 +40428,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -39732,20 +40437,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-12-02", + "last_updated": "2026-04-30", "cost": { - "input": 0.144, - "output": 0.431 + "input": 0.5, + "output": 1.6 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "openai-gpt-5.4-pro", + "name": "GPT-5.4 pro", + "display_name": "GPT-5.4 pro", "modalities": { "input": [ "text", @@ -39756,29 +40473,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 2.294, - "output": 6.881 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -39788,8 +40506,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -39797,19 +40515,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2026-04-30", "cost": { - "input": 0.287, - "output": 1.147 + "input": 0.45, + "output": 1.7 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "openai-gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -39820,7 +40539,7 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -39828,31 +40547,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-08-05", + "last_updated": "2026-04-16", "cost": { - "input": 0.574, - "output": 2.294 + "input": 0.05, + "output": 0.45 }, "type": "chat" }, { - "id": "qvq-max", - "name": "QVQ Max", - "display_name": "QVQ Max", + "id": "openai-gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -39863,73 +40572,112 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 1.147, - "output": 4.588 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Moonshot Kimi K2 Thinking", - "display_name": "Moonshot Kimi K2 Thinking", + "id": "anthropic-claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.574, - "output": 2.294 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 0.5, + "cache_write": 6.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 0.5, + "cache_write": 6.25 + } }, "type": "chat" }, { - "id": "qwen3-14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "alibaba-qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -39939,79 +40687,117 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-04-30", + "last_updated": "2026-04-16", "cost": { - "input": 0.144, - "output": 0.574, - "reasoning": 1.434 + "input": 0.25, + "output": 0.55 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-8b", - "name": "DeepSeek R1 Distill Llama 8B", - "display_name": "DeepSeek R1 Distill Llama 8B", + "id": "gemma-4-31B-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 256000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-30", + "cost": { + "input": 0.18, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "anthropic-claude-3.7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-11", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long", - "display_name": "Qwen Long", + "id": "llama3-8b-instruct", + "name": "Llama 3.1 Instruct (8B)", + "display_name": "Llama 3.1 Instruct (8B)", "modalities": { "input": [ "text" @@ -40021,76 +40807,90 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.072, - "output": 0.287 + "input": 0.198, + "output": 0.198 }, "type": "chat" }, { - "id": "kimi/kimi-k2.5", - "name": "kimi/kimi-k2.5", - "display_name": "kimi/kimi-k2.5", + "id": "anthropic-claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "MiniMax/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "gte-large-en-v1.5", + "name": "GTE Large (v1.5)", + "display_name": "GTE Large (v1.5)", "modalities": { "input": [ "text" @@ -40100,73 +40900,83 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-03-27", + "last_updated": "2026-04-16", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.09, + "output": 0 }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3-0324", - "name": "siliconflow/deepseek-v3-0324", - "display_name": "siliconflow/deepseek-v3-0324", + "id": "anthropic-claude-4.6-sonnet", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.25, - "output": 1 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 + } }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3.2", - "name": "siliconflow/deepseek-v3.2", - "display_name": "siliconflow/deepseek-v3.2", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -40176,8 +40986,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -40191,30 +41001,32 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "open_weights": true, + "release_date": "2025-01-30", + "last_updated": "2025-01-30", "cost": { - "input": 0.27, - "output": 0.42 + "input": 0.99, + "output": 0.99 }, "type": "chat" }, { - "id": "siliconflow/deepseek-r1-0528", - "name": "siliconflow/deepseek-r1-0528", - "display_name": "siliconflow/deepseek-r1-0528", + "id": "anthropic-claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -40222,31 +41034,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.5, - "output": 2.18 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3.1-terminus", - "name": "siliconflow/deepseek-v3.1-terminus", - "display_name": "siliconflow/deepseek-v3.1-terminus", + "id": "multi-qa-mpnet-base-dot-v1", + "name": "Multi-QA-mpnet-base-dot-v1", + "display_name": "Multi-QA-mpnet-base-dot-v1", "modalities": { "input": [ "text" @@ -40256,29 +41060,28 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 512, + "output": 768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2021-08-30", + "last_updated": "2026-04-16", "cost": { - "input": 0.27, - "output": 1 + "input": 0.009, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "qwen-2.5-14b-instruct", + "name": "Qwen 2.5 14B Instruct", + "display_name": "Qwen 2.5 14B Instruct", "modalities": { "input": [ "text" @@ -40288,8 +41091,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -40298,19 +41101,15 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 1, - "output": 5 - }, + "knowledge": "2024-09", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "e5-large-v2", + "name": "E5 Large v2", + "display_name": "E5 Large v2", "modalities": { "input": [ "text" @@ -40320,53 +41119,41 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2023-05-19", + "last_updated": "2026-04-30", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.02, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "anthropic-claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -40374,60 +41161,60 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-09-23", - "name": "Qwen3 Coder Plus 2025 09 23", - "display_name": "Qwen3 Coder Plus 2025 09 23", + "id": "openai-gpt-image-1.5", + "name": "GPT Image 1.5", + "display_name": "GPT Image 1.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "cost": { + "input": 5, + "output": 10, + "cache_read": 1 + }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-07-22", - "name": "Qwen3 Coder Plus 2025 07 22", - "display_name": "Qwen3 Coder Plus 2025 07 22", + "id": "llama-4-maverick", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -40435,123 +41222,186 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2026-04-30", + "cost": { + "input": 0.25, + "output": 0.87 + }, "type": "chat" }, { - "id": "qwen-vl-ocr-latest", - "name": "Qwen Vl Ocr Latest", - "display_name": "Qwen Vl Ocr Latest", + "id": "openai-gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 1000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, - "attachment": false, "type": "chat" }, { - "id": "qvq-max-2025-05-15", - "name": "Qvq Max 2025 05 15", - "display_name": "Qvq Max 2025 05 15", + "id": "anthropic-claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 16384, - "min": 0, - "max": 16384 + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 } }, - "attachment": false, "type": "chat" }, { - "id": "qwen-turbo-latest", - "name": "Qwen Turbo Latest", - "display_name": "Qwen Turbo Latest", + "id": "openai-o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "type": "chat" + }, + { + "id": "wan2-2-t2v-a14b", + "name": "Wan2.2-T2V-A14B", + "display_name": "Wan2.2-T2V-A14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "limit": { + "context": 100, + "output": 1 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2026-04-30", + "cost": { + "input": 0.6, + "output": 0 + }, "type": "chat" }, { - "id": "qwen-turbo-2024-09-19", - "name": "Qwen Turbo 2024 09 19", - "display_name": "Qwen Turbo 2024 09 19", + "id": "anthropic-claude-3.5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text" @@ -40561,7 +41411,7 @@ ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -40570,12 +41420,22 @@ "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-11-05", + "last_updated": "2024-11-05", + "cost": { + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + }, "type": "chat" }, { - "id": "qwen-flash-2025-07-28", - "name": "Qwen Flash 2025 07 28", - "display_name": "Qwen Flash 2025 07 28", + "id": "bge-m3", + "name": "BGE M3", + "display_name": "BGE M3", "modalities": { "input": [ "text" @@ -40585,115 +41445,129 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 8192, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-01-30", + "last_updated": "2026-04-30", + "cost": { + "input": 0.02, + "output": 0 }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "type": "embedding" + }, + { + "id": "mistral-3-14B", + "name": "Ministral 3 14B Instruct", + "display_name": "Ministral 3 14B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, + "open_weights": true, + "release_date": "2025-12-15", + "last_updated": "2026-04-30", + "cost": { + "input": 0.2, + "output": 0.2 + }, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "openai-gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-plus-2024-09-19", - "name": "Qwen Plus 2024 09 19", - "display_name": "Qwen Plus 2024 09 19", + "id": "anthropic-claude-3-opus", + "name": "Claude 3 Opus", + "display_name": "Claude 3 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": false, + "knowledge": "2023-08", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, "type": "chat" }, { - "id": "qwen-plus-2025-07-14", - "name": "Qwen Plus 2025 07 14", - "display_name": "Qwen Plus 2025 07 14", + "id": "glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -40703,19 +41577,13 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 202752, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -40728,41 +41596,38 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-04-16", + "cost": { + "input": 1, + "output": 3.2 + }, "type": "chat" }, { - "id": "qwen-plus-2025-09-11", - "name": "Qwen Plus 2025 09 11", - "display_name": "Qwen Plus 2025 09 11", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -40775,19 +41640,21 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.95, + "output": 4 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "openai-gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -40798,137 +41665,162 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-08-05", + "last_updated": "2026-04-16", + "cost": { + "input": 0.1, + "output": 0.7 + }, "type": "chat" }, { - "id": "qwen-max-2024-09-19", - "name": "Qwen Max 2024 09 19", - "display_name": "Qwen Max 2024 09 19", + "id": "fal-ai/fast-sdxl", + "name": "Fast SDXL", + "display_name": "Fast SDXL", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, + "context": 8192, "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": true, + "release_date": "2023-07-26", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "qwen-max-2024-04-28", - "name": "Qwen Max 2024 04 28", - "display_name": "Qwen Max 2024 04 28", + "id": "fal-ai/flux/schnell", + "name": "FLUX.1 [schnell]", + "display_name": "FLUX.1 [schnell]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "qwen-max-2024-04-03", - "name": "Qwen Max 2024 04 03", - "display_name": "Qwen Max 2024 04 03", - "modalities": { - "input": [ + "id": "fal-ai/elevenlabs/tts/multilingual-v2", + "name": "ElevenLabs Multilingual TTS v2", + "display_name": "ElevenLabs Multilingual TTS v2", + "modalities": { + "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2023-08-22", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen Max 2025 01 25", - "display_name": "Qwen Max 2025 01 25", + "id": "fal-ai/stable-audio-25/text-to-audio", + "name": "Stable Audio 2.5 (Text-to-Audio)", + "display_name": "Stable Audio 2.5 (Text-to-Audio)", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "release_date": "2025-10-08", + "last_updated": "2026-04-16", "type": "chat" - }, + } + ] + }, + "moonshot-ai": { + "id": "moonshot-ai", + "name": "Moonshot AI", + "display_name": "Moonshot AI", + "api": "https://api.moonshot.ai/v1", + "doc": "https://platform.moonshot.ai/docs/api/chat", + "models": [ { - "id": "qwen3-max-2025-09-23", - "name": "Qwen3 Max 20250923", - "display_name": "Qwen3 Max 20250923", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -40936,26 +41828,41 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", + "cost": { + "input": 0.6, + "output": 3, + "cache_read": 0.1 + }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -40966,37 +41873,29 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -41006,19 +41905,14 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -41032,36 +41926,21 @@ } }, "attachment": false, - "type": "chat" - }, - { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ "text" @@ -41072,7 +41951,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -41080,12 +41959,21 @@ "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -41095,19 +41983,14 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -41121,34 +42004,40 @@ } }, "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 1.15, + "output": 8, + "cache_read": 0.15 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -41161,13 +42050,22 @@ ] } }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.95, + "output": 4, + "cache_read": 0.16 + }, "type": "chat" }, { - "id": "qwen3-4b", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ "text" @@ -41177,162 +42075,136 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 2.4, + "output": 10, + "cache_read": 0.6 + }, "type": "chat" - }, + } + ] + }, + "mistral": { + "id": "mistral", + "name": "Mistral", + "display_name": "Mistral", + "doc": "https://docs.mistral.ai/getting-started/models/", + "models": [ { - "id": "qwen3-1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "mistral-medium-2604", + "name": "Mistral Medium 3.5", + "display_name": "Mistral Medium 3.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "release_date": "2026-04-29", + "last_updated": "2026-04-29", + "cost": { + "input": 1.5, + "output": 7.5 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-vl-plus-2025-09-23", - "name": "Qwen3 VL Plus 2025 09 23", - "display_name": "Qwen3 VL Plus 2025 09 23", + "id": "ministral-3b-latest", + "name": "Ministral 3B (latest)", + "display_name": "Ministral 3B (latest)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", + "cost": { + "input": 0.04, + "output": 0.04 + }, "type": "chat" }, { - "id": "qwq-plus-latest", - "name": "QwQ Plus Latest", - "display_name": "QwQ Plus Latest", + "id": "mistral-large-2411", + "name": "Mistral Large 2.1", + "display_name": "Mistral Large 2.1", "modalities": { "input": [ "text" @@ -41343,49 +42215,28 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", + "cost": { + "input": 2, + "output": 6 + }, "type": "chat" - } - ] - }, - "firepass": { - "id": "firepass", - "name": "Fireworks (Firepass)", - "display_name": "Fireworks (Firepass)", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://docs.fireworks.ai/firepass", - "models": [ + }, { - "id": "accounts/fireworks/routers/kimi-k2p6-turbo", - "name": "Kimi K2.6 Turbo", - "display_name": "Kimi K2.6 Turbo", + "id": "pixtral-12b", + "name": "Pixtral 12B", + "display_name": "Pixtral 12B", "modalities": { "input": [ "text", @@ -41396,50 +42247,29 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.15, + "output": 0.15 }, "type": "chat" - } - ] - }, - "minimax-cn-coding-plan": { - "id": "minimax-cn-coding-plan", - "name": "MiniMax Coding Plan (minimaxi.com)", - "display_name": "MiniMax Coding Plan (minimaxi.com)", - "api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/coding-plan/intro", - "models": [ + }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "codestral-latest", + "name": "Codestral (latest)", + "display_name": "Codestral (latest)", "modalities": { "input": [ "text" @@ -41449,34 +42279,29 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "open-mixtral-8x22b", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ "text" @@ -41486,47 +42311,41 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 64000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-04", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "mistral-small-latest", + "name": "Mistral Small (latest)", + "display_name": "Mistral Small (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -41534,44 +42353,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "mistral-small-2603", + "name": "Mistral Small 4", + "display_name": "Mistral Small 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -41579,33 +42387,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -41615,34 +42411,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "open-mistral-7b", + "name": "Mistral 7B", + "display_name": "Mistral 7B", "modalities": { "input": [ "text" @@ -41652,83 +42443,62 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "knowledge": "2023-12", + "release_date": "2023-09-27", + "last_updated": "2023-09-27", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.25, + "output": 0.25 }, "type": "chat" - } - ] - }, - "bailing": { - "id": "bailing", - "name": "Bailing", - "display_name": "Bailing", - "api": "https://api.tbox.cn/api/llm/v1/chat/completions", - "doc": "https://alipaytbox.yuque.com/sxs0ba/ling/intro", - "models": [ + }, { - "id": "Ring-1T", - "name": "Ring-1T", - "display_name": "Ring-1T", + "id": "mistral-medium-2508", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-10", - "last_updated": "2025-10", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.57, - "output": 2.29 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "Ling-1T", - "name": "Ling-1T", - "display_name": "Ling-1T", + "id": "devstral-medium-2507", + "name": "Devstral Medium", + "display_name": "Devstral Medium", "modalities": { "input": [ "text" @@ -41739,7 +42509,7 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -41748,28 +42518,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-10", - "last_updated": "2025-10", + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.57, - "output": 2.29 + "input": 0.4, + "output": 2 }, "type": "chat" - } - ] - }, - "iflowcn": { - "id": "iflowcn", - "name": "iFlow", - "display_name": "iFlow", - "api": "https://apis.iflow.cn/v1", - "doc": "https://platform.iflow.cn/en/docs", - "models": [ + }, { - "id": "qwen3-coder-plus", - "name": "Qwen3-Coder-Plus", - "display_name": "Qwen3-Coder-Plus", + "id": "devstral-small-2505", + "name": "Devstral Small 2505", + "display_name": "Devstral Small 2505", "modalities": { "input": [ "text" @@ -41779,8 +42540,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -41789,19 +42550,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -41811,40 +42572,29 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "magistral-medium-latest", + "name": "Magistral Medium (latest)", + "display_name": "Magistral Medium (latest)", "modalities": { "input": [ "text" @@ -41855,7 +42605,7 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -41863,32 +42613,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 5 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3-Max", - "display_name": "Qwen3-Max", + "id": "magistral-small", + "name": "Magistral Small", + "display_name": "Magistral Small", "modalities": { "input": [ "text" @@ -41898,40 +42637,30 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct", - "name": "Qwen3-235B-A22B-Instruct", - "display_name": "Qwen3-235B-A22B-Instruct", + "id": "devstral-small-2507", + "name": "Devstral Small", + "display_name": "Devstral Small", "modalities": { "input": [ "text" @@ -41941,8 +42670,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -41951,63 +42680,52 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3-235B-A22B-Thinking", - "display_name": "Qwen3-235B-A22B-Thinking", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "kimi-k2-0905", - "name": "Kimi-K2-0905", - "display_name": "Kimi-K2-0905", + "id": "devstral-medium-latest", + "name": "Devstral 2 (latest)", + "display_name": "Devstral 2 (latest)", "modalities": { "input": [ "text" @@ -42017,8 +42735,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -42026,58 +42744,53 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "mistral-small-2506", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2025-11-13", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3-VL-Plus", - "display_name": "Qwen3-VL-Plus", + "id": "mistral-large-latest", + "name": "Mistral Large (latest)", + "display_name": "Mistral Large (latest)", "modalities": { "input": [ "text", @@ -42088,67 +42801,52 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2-Exp", - "display_name": "DeepSeek-V3.2-Exp", + "id": "labs-devstral-small-2512", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { "input": 0, "output": 0 @@ -42156,9 +42854,9 @@ "type": "chat" }, { - "id": "qwen3-235b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", "modalities": { "input": [ "text" @@ -42168,30 +42866,28 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 8000, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": false, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0, + "input": 0.1, "output": 0 }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi-K2", - "display_name": "Kimi-K2", + "id": "open-mixtral-8x7b", + "name": "Mixtral 8x7B", + "display_name": "Mixtral 8x7B", "modalities": { "input": [ "text" @@ -42201,8 +42897,8 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 32000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -42210,20 +42906,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2024-01", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0, - "output": 0 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3-Max-Preview", - "display_name": "Qwen3-Max-Preview", + "id": "ministral-8b-latest", + "name": "Ministral 8B (latest)", + "display_name": "Ministral 8B (latest)", "modalities": { "input": [ "text" @@ -42233,43 +42929,33 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "pixtral-large-latest", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -42277,36 +42963,28 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 6 }, "type": "chat" - } - ] - }, - "v0": { - "id": "v0", - "name": "v0", - "display_name": "v0", - "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", - "models": [ + }, { - "id": "v0-1.5-lg", - "name": "v0-1.5-lg", - "display_name": "v0-1.5-lg", + "id": "mistral-medium-latest", + "name": "Mistral Medium (latest)", + "display_name": "Mistral Medium (latest)", "modalities": { "input": [ "text", @@ -42317,8 +42995,8 @@ ] }, "limit": { - "context": 512000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -42327,31 +43005,39 @@ "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "open_weights": true, + "release_date": "2026-04-29", + "last_updated": "2026-04-29", "cost": { - "input": 15, - "output": 75 + "input": 1.5, + "output": 7.5 }, "type": "chat" - }, + } + ] + }, + "kilo": { + "id": "kilo", + "name": "Kilo Gateway", + "display_name": "Kilo Gateway", + "api": "https://api.kilo.ai/api/gateway", + "doc": "https://kilo.ai", + "models": [ { - "id": "v0-1.0-md", - "name": "v0-1.0-md", - "display_name": "v0-1.0-md", + "id": "prime-intellect/intellect-3", + "name": "Prime Intellect: INTELLECT-3", + "display_name": "Prime Intellect: INTELLECT-3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -42359,74 +43045,93 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-11-26", + "last_updated": "2026-02-04", "cost": { - "input": 3, - "output": 15 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "v0-1.5-md", - "name": "v0-1.5-md", - "display_name": "v0-1.5-md", + "id": "liquid/lfm-2-24b-a2b", + "name": "LiquidAI: LFM2-24B-A2B", + "display_name": "LiquidAI: LFM2-24B-A2B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15 + "input": 0.03, + "output": 0.12 }, "type": "chat" - } - ] - }, - "huggingface": { - "id": "huggingface", - "name": "Hugging Face", - "display_name": "Hugging Face", - "api": "https://router.huggingface.co/v1", - "doc": "https://huggingface.co/docs/inference-providers", - "models": [ + }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "undi95/remm-slerp-l2-13b", + "name": "ReMM SLERP 13B", + "display_name": "ReMM SLERP 13B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 6144, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-07-22", + "last_updated": "2026-03-15", + "cost": { + "input": 0.45, + "output": 0.65 + }, + "type": "chat" + }, + { + "id": "inception/mercury-2", + "name": "Inception: Mercury 2", + "display_name": "Inception: Mercury 2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 50000 }, "temperature": true, "tool_call": true, @@ -42434,32 +43139,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next", - "name": "Qwen3-Coder-Next", - "display_name": "Qwen3-Coder-Next", + "id": "sao10k/l3.1-70b-hanami-x1", + "name": "Sao10K: Llama 3.1 70B Hanami x1", + "display_name": "Sao10K: Llama 3.1 70B Hanami x1", "modalities": { "input": [ "text" @@ -42469,29 +43163,28 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 16000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "release_date": "2025-01-08", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1.5 + "input": 3, + "output": 3 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen3-Next-80B-A3B-Instruct", + "id": "sao10k/l3.1-euryale-70b", + "name": "Sao10K: Llama 3.1 Euryale 70B v2.2", + "display_name": "Sao10K: Llama 3.1 Euryale 70B v2.2", "modalities": { "input": [ "text" @@ -42501,8 +43194,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -42511,19 +43204,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "release_date": "2024-08-28", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 1 + "input": 0.85, + "output": 0.85 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen 3 Embedding 8B", - "display_name": "Qwen 3 Embedding 8B", + "id": "sao10k/l3-lunaris-8b", + "name": "Sao10K: Llama 3 8B Lunaris", + "display_name": "Sao10K: Llama 3 8B Lunaris", "modalities": { "input": [ "text" @@ -42533,29 +43225,28 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2024-08-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.01, - "output": 0 + "input": 0.04, + "output": 0.05 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "sao10k/l3-euryale-70b", + "name": "Sao10k: Llama 3 Euryale 70B v2.1", + "display_name": "Sao10k: Llama 3 Euryale 70B v2.1", "modalities": { "input": [ "text" @@ -42565,41 +43256,28 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "release_date": "2024-06-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 3 + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "sao10k/l3.3-euryale-70b", + "name": "Sao10K: Llama 3.3 Euryale 70B", + "display_name": "Sao10K: Llama 3.3 Euryale 70B", "modalities": { "input": [ "text" @@ -42609,40 +43287,28 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "release_date": "2024-12-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 2 + "input": 0.65, + "output": 0.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-4B", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", + "id": "ibm-granite/granite-4.0-h-micro", + "name": "IBM: Granite 4.0 Micro", + "display_name": "IBM: Granite 4.0 Micro", "modalities": { "input": [ "text" @@ -42652,29 +43318,28 @@ ] }, "limit": { - "context": 32000, - "output": 2048 + "context": 131000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-10-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.01, - "output": 0 + "input": 0.017, + "output": 0.11 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen3-Coder-480B-A35B-Instruct", + "id": "ibm-granite/granite-4.1-8b", + "name": "IBM: Granite 4.1 8B", + "display_name": "IBM: Granite 4.1 8B", "modalities": { "input": [ "text" @@ -42684,8 +43349,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -42693,20 +43358,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2026-04-30", + "last_updated": "2026-05-01", "cost": { - "input": 2, - "output": 2 + "input": 0.05, + "output": 0.1, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-Flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "cohere/command-r-08-2024", + "name": "Cohere: Command R (08-2024)", + "display_name": "Cohere: Command R (08-2024)", "modalities": { "input": [ "text" @@ -42716,41 +43381,28 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "cohere/command-r-plus-08-2024", + "name": "Cohere: Command R+ (08-2024)", + "display_name": "Cohere: Command R+ (08-2024)", "modalities": { "input": [ "text" @@ -42760,42 +43412,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "cohere/command-r7b-12-2024", + "name": "Cohere: Command R7B (12-2024)", + "display_name": "Cohere: Command R7B (12-2024)", "modalities": { "input": [ "text" @@ -42805,41 +43443,28 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-03", - "last_updated": "2026-04-03", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.0375, + "output": 0.15 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "cohere/command-a", + "name": "Cohere: Command A", + "display_name": "Cohere: Command A", "modalities": { "input": [ "text" @@ -42849,41 +43474,28 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 256000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "XiaomiMiMo/MiMo-V2-Flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "thedrummer/unslopnemo-12b", + "name": "TheDrummer: UnslopNemo 12B", + "display_name": "TheDrummer: UnslopNemo 12B", "modalities": { "input": [ "text" @@ -42893,30 +43505,28 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2024-11-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "thedrummer/cydonia-24b-v4.1", + "name": "TheDrummer: Cydonia 24B V4.1", + "display_name": "TheDrummer: Cydonia 24B V4.1", "modalities": { "input": [ "text" @@ -42926,41 +43536,28 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-09-27", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 5 + "input": 0.3, + "output": 0.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "thedrummer/rocinante-12b", + "name": "TheDrummer: Rocinante 12B", + "display_name": "TheDrummer: Rocinante 12B", "modalities": { "input": [ "text" @@ -42970,35 +43567,28 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2024-09-30", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 0.4 + "input": 0.17, + "output": 0.43 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi-K2-Thinking", - "display_name": "Kimi-K2-Thinking", + "id": "thedrummer/skyfall-36b-v2", + "name": "TheDrummer: Skyfall 36B V2", + "display_name": "TheDrummer: Skyfall 36B V2", "modalities": { "input": [ "text" @@ -43008,89 +43598,60 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2025-03-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.55, + "output": 0.8 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + "id": "bytedance/ui-tars-1.5-7b", + "name": "ByteDance: UI-TARS 7B ", + "display_name": "ByteDance: UI-TARS 7B ", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2026-03-15", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.1, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi-K2-Instruct", - "display_name": "Kimi-K2-Instruct", + "id": "alfredpros/codellama-7b-instruct-solidity", + "name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", + "display_name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", "modalities": { "input": [ "text" @@ -43100,29 +43661,28 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 3 + "input": 0.8, + "output": 1.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi-K2-Instruct-0905", - "display_name": "Kimi-K2-Instruct-0905", + "id": "deepcogito/cogito-v2.1-671b", + "name": "Deep Cogito: Cogito v2.1 671B", + "display_name": "Deep Cogito: Cogito v2.1 671B", "modalities": { "input": [ "text" @@ -43132,34 +43692,33 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", + "release_date": "2025-11-14", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 3 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "moonshotai/kimi-k2.5", + "name": "MoonshotAI: Kimi K2.5", + "display_name": "MoonshotAI: Kimi K2.5", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" @@ -43167,7 +43726,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65535 }, "temperature": true, "tool_call": true, @@ -43188,20 +43747,18 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2026-01-27", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.45, + "output": 2.2 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "moonshotai/kimi-k2-0905", + "name": "MoonshotAI: Kimi K2 0905", + "display_name": "MoonshotAI: Kimi K2 0905", "modalities": { "input": [ "text" @@ -43211,41 +43768,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.4, + "output": 2, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "moonshotai/kimi-k2-thinking", + "name": "MoonshotAI: Kimi K2 Thinking", + "display_name": "MoonshotAI: Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -43255,8 +43800,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -43277,19 +43822,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-11-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.47, + "output": 2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "moonshotai/kimi-k2", + "name": "MoonshotAI: Kimi K2 0711", + "display_name": "MoonshotAI: Kimi K2 0711", "modalities": { "input": [ "text" @@ -43299,52 +43844,40 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131000, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2025-07-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "moonshotai/kimi-k2.6", + "name": "MoonshotAI: Kimi K2.6", + "display_name": "MoonshotAI: Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -43354,40 +43887,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-04-20", + "last_updated": "2026-05-12", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.75, + "output": 3.5, + "cache_read": 0.375 }, "type": "chat" - } - ] - }, - "upstage": { - "id": "upstage", - "name": "Upstage", - "display_name": "Upstage", - "api": "https://api.upstage.ai/v1/solar", - "doc": "https://developers.upstage.ai/docs/apis/chat", - "models": [ + }, { - "id": "solar-pro2", - "name": "solar-pro2", - "display_name": "solar-pro2", + "id": "morph/morph-v3-large", + "name": "Morph: Morph V3 Large", + "display_name": "Morph: Morph V3 Large", "modalities": { "input": [ "text" @@ -43397,30 +43914,28 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 262144, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.25, - "output": 0.25 - }, + "input": 0.9, + "output": 1.9 + }, "type": "chat" }, { - "id": "solar-mini", - "name": "solar-mini", - "display_name": "solar-mini", + "id": "morph/morph-v3-fast", + "name": "Morph: Morph V3 Fast", + "display_name": "Morph: Morph V3 Fast", "modalities": { "input": [ "text" @@ -43430,40 +43945,41 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 81920, + "output": 38000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-06-12", - "last_updated": "2025-04-22", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.8, + "output": 1.2 }, "type": "chat" }, { - "id": "solar-pro3", - "name": "solar-pro3", - "display_name": "solar-pro3", + "id": "bytedance-seed/seed-1.6-flash", + "name": "ByteDance Seed: Seed 1.6 Flash", + "display_name": "ByteDance Seed: Seed 1.6 Flash", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -43471,41 +43987,33 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2026-01", - "last_updated": "2026-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 0.25 + "input": 0.075, + "output": 0.3 }, "type": "chat" - } - ] - }, - "novita-ai": { - "id": "novita-ai", - "name": "NovitaAI", - "display_name": "NovitaAI", - "api": "https://api.novita.ai/openai", - "doc": "https://novita.ai/docs/guides/introduction", - "models": [ + }, { - "id": "deepseek/deepseek-r1-turbo", - "name": "DeepSeek R1 (Turbo)\t", - "display_name": "DeepSeek R1 (Turbo)\t", + "id": "bytedance-seed/seed-1.6", + "name": "ByteDance Seed: Seed 1.6", + "display_name": "ByteDance Seed: Seed 1.6", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -43513,153 +44021,160 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "attachment": true, + "open_weights": false, + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.7, - "output": 2.5 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "bytedance-seed/seed-2.0-mini", + "name": "ByteDance Seed: Seed-2.0-Mini", + "display_name": "ByteDance Seed: Seed-2.0-Mini", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2026-02-27", + "last_updated": "2026-03-15", "cost": { - "input": 0.27, - "output": 1.12, - "cache_read": 0.135 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek/deepseek-ocr-2", - "name": "deepseek/deepseek-ocr-2", - "display_name": "deepseek/deepseek-ocr-2", + "id": "bytedance-seed/seed-2.0-lite", + "name": "ByteDance Seed: Seed-2.0-Lite", + "display_name": "ByteDance Seed: Seed-2.0-Lite", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2026-03-10", + "last_updated": "2026-03-15", "cost": { - "input": 0.03, - "output": 0.03 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "deepseek/deepseek-ocr", - "name": "DeepSeek-OCR", - "display_name": "DeepSeek-OCR", + "id": "z-ai/glm-5.1", + "name": "Z.ai: GLM 5.1", + "display_name": "Z.ai: GLM 5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-10-24", - "last_updated": "2025-10-24", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.03, - "output": 0.03 + "input": 1.26, + "output": 3.96 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill LLama 70B", - "display_name": "DeepSeek R1 Distill LLama 70B", + "id": "z-ai/glm-5v-turbo", + "name": "Z.ai: GLM 5V Turbo", + "display_name": "Z.ai: GLM 5V Turbo", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2026-04-01", + "last_updated": "2026-04-11", "cost": { - "input": 0.8, - "output": 0.8 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "deepseek/deepseek-prover-v2-671b", - "name": "Deepseek Prover V2 671B", - "display_name": "Deepseek Prover V2 671B", + "id": "z-ai/glm-4.5-air", + "name": "Z.ai: GLM 4.5 Air", + "display_name": "Z.ai: GLM 4.5 Air", "modalities": { "input": [ "text" @@ -43669,60 +44184,64 @@ ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 131072, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-04-30", - "last_updated": "2025-04-30", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.7, - "output": 2.5 + "input": 0.13, + "output": 0.85, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528-qwen3-8b", - "name": "DeepSeek R1 0528 Qwen3 8B", - "display_name": "DeepSeek R1 0528 Qwen3 8B", + "id": "z-ai/glm-4.5v", + "name": "Z.ai: GLM 4.5V", + "display_name": "Z.ai: GLM 4.5V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 65536, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-05-29", - "last_updated": "2025-05-29", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0.06, - "output": 0.09 + "input": 0.6, + "output": 1.8, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-32b", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill Qwen 32B", + "id": "z-ai/glm-4.7-flash", + "name": "Z.ai: GLM 4.7 Flash", + "display_name": "Z.ai: GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -43732,29 +44251,35 @@ ] }, "limit": { - "context": 64000, - "output": 32000 + "context": 202752, + "output": 40551 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.06, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "Deepseek V3.2 Exp", - "display_name": "Deepseek V3.2 Exp", + "id": "z-ai/glm-4.6", + "name": "Z.ai: GLM 4.6", + "display_name": "Z.ai: GLM 4.6", "modalities": { "input": [ "text" @@ -43764,8 +44289,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 204800, + "output": 204800 }, "temperature": true, "tool_call": true, @@ -43773,20 +44298,26 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-09-30", + "last_updated": "2026-03-15", "cost": { - "input": 0.27, - "output": 0.41 + "input": 0.39, + "output": 1.9, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "z-ai/glm-4.5", + "name": "Z.ai: GLM 4.5", + "display_name": "Z.ai: GLM 4.5", "modalities": { "input": [ "text" @@ -43797,7 +44328,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 98304 }, "temperature": true, "tool_call": true, @@ -43807,19 +44338,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-07-28", + "last_updated": "2026-03-15", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 + "input": 0.6, + "output": 2.2, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "Deepseek V3.2", - "display_name": "Deepseek V3.2", + "id": "z-ai/glm-5-turbo", + "name": "Z.ai: GLM 5 Turbo", + "display_name": "Z.ai: GLM 5 Turbo", "modalities": { "input": [ "text" @@ -43829,8 +44360,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -43840,30 +44371,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-03-15", + "last_updated": "2026-04-11", "cost": { - "input": 0.269, - "output": 0.4, - "cache_read": 0.1345 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3-turbo", - "name": "DeepSeek V3 (Turbo)\t", - "display_name": "DeepSeek V3 (Turbo)\t", + "id": "z-ai/glm-4.7", + "name": "Z.ai: GLM 4.7", + "display_name": "Z.ai: GLM 4.7", "modalities": { "input": [ "text" @@ -43873,28 +44398,41 @@ ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "release_date": "2025-12-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 1.3 + "input": 0.38, + "output": 1.98, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-14b", - "name": "DeepSeek R1 Distill Qwen 14B", - "display_name": "DeepSeek R1 Distill Qwen 14B", + "id": "z-ai/glm-4-32b", + "name": "Z.ai: GLM 4 32B ", + "display_name": "Z.ai: GLM 4 32B ", "modalities": { "input": [ "text" @@ -43904,29 +44442,28 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-07-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "z-ai/glm-5", + "name": "Z.ai: GLM 5", + "display_name": "Z.ai: GLM 5", "modalities": { "input": [ "text" @@ -43936,8 +44473,8 @@ ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -43958,23 +44495,23 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2026-02-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.7, - "output": 2.5, - "cache_read": 0.35 + "input": 0.72, + "output": 2.3 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "Deepseek V3.1 Terminus", - "display_name": "Deepseek V3.1 Terminus", + "id": "z-ai/glm-4.6v", + "name": "Z.ai: GLM 4.6V", + "display_name": "Z.ai: GLM 4.6V", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" @@ -43982,7 +44519,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -43990,23 +44527,24 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "release_date": "2025-09-30", + "last_updated": "2026-01-10", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "inclusionai/ling-2.6-1t", - "name": "Ling-2.6-1T", - "display_name": "Ling-2.6-1T", + "id": "openai/gpt-4o", + "name": "OpenAI: GPT-4o", + "display_name": "OpenAI: GPT-4o", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44014,62 +44552,64 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": true, + "open_weights": false, + "release_date": "2024-05-13", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "paddlepaddle/paddleocr-vl", - "name": "PaddleOCR-VL", - "display_name": "PaddleOCR-VL", + "id": "openai/gpt-4o-mini-search-preview", + "name": "OpenAI: GPT-4o-mini Search Preview", + "display_name": "OpenAI: GPT-4o-mini Search Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 128000, "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", + "attachment": false, + "open_weights": false, + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "nousresearch/hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "openai/gpt-5.2", + "name": "OpenAI: GPT-5.2", + "display_name": "OpenAI: GPT-5.2", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44077,28 +44617,52 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-27", - "last_updated": "2024-06-27", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0.14 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "openai/gpt-3.5-turbo", + "name": "OpenAI: GPT-3.5 Turbo", + "display_name": "OpenAI: GPT-3.5 Turbo", "modalities": { "input": [ "text" @@ -44108,43 +44672,32 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16385, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "openai/o3-pro", + "name": "OpenAI: o3 Pro", + "display_name": "OpenAI: o3 Pro", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44152,10 +44705,10 @@ ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -44164,29 +44717,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-16", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "zai-org/glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "openai/gpt-3.5-turbo-16k", + "name": "OpenAI: GPT-3.5 Turbo 16k", + "display_name": "OpenAI: GPT-3.5 Turbo 16k", "modalities": { "input": [ "text" @@ -44196,43 +44751,32 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16385, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2023-08-28", + "last_updated": "2026-03-15", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "zai-org/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "openai/gpt-5.4-nano", + "name": "OpenAI: GPT-5.4 Nano", + "display_name": "OpenAI: GPT-5.4 Nano", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44240,52 +44784,66 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "zai-org/glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "openai/gpt-5-image-mini", + "name": "OpenAI: GPT-5 Image Mini", + "display_name": "OpenAI: GPT-5 Image Mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -44293,59 +44851,62 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-10-13", - "last_updated": "2025-10-13", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-16", + "last_updated": "2026-03-15", "cost": { - "input": 0.13, - "output": 0.85 + "input": 2.5, + "output": 2 }, "type": "chat" }, { - "id": "zai-org/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "openai/gpt-5.5-pro", + "name": "OpenAI: GPT-5.5 Pro", + "display_name": "OpenAI: GPT-5.5 Pro", "modalities": { "input": [ "text", - "video", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { - "input": 0.6, - "output": 1.8, - "cache_read": 0.11 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "zai-org/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "openai/gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1-Codex-Mini", + "display_name": "OpenAI: GPT-5.1-Codex-Mini", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -44353,79 +44914,109 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.55, - "output": 2.2, - "cache_read": 0.11 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "zai-org/glm-4.6v", - "name": "GLM 4.6V", - "display_name": "GLM 4.6V", + "id": "openai/gpt-5.2-pro", + "name": "OpenAI: GPT-5.2 Pro", + "display_name": "OpenAI: GPT-5.2 Pro", "modalities": { "input": [ - "text", - "video", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.055 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "openai/gpt-4o-2024-05-13", + "name": "OpenAI: GPT-4o (2024-05-13)", + "display_name": "OpenAI: GPT-4o (2024-05-13)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44433,99 +45024,117 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "attachment": true, + "open_weights": false, + "release_date": "2024-05-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "zai-org/autoglm-phone-9b-multilingual", - "name": "AutoGLM-Phone-9B-Multilingual", - "display_name": "AutoGLM-Phone-9B-Multilingual", + "id": "openai/gpt-4-0314", + "name": "OpenAI: GPT-4 (older v0314)", + "display_name": "OpenAI: GPT-4 (older v0314)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 8191, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-10", - "last_updated": "2025-12-10", + "attachment": false, + "open_weights": false, + "release_date": "2023-05-28", + "last_updated": "2026-03-15", "cost": { - "input": 0.035, - "output": 0.138 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "openai/gpt-5.4-image-2", + "name": "OpenAI: GPT-5.4 Image 2", + "display_name": "OpenAI: GPT-5.4 Image 2", "modalities": { "input": [ - "text" + "image", + "text", + "pdf" ], "output": [ + "image", "text" ] }, "limit": { - "context": 60288, - "output": 16000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-30", - "last_updated": "2024-07-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 0.04, - "output": 0.17 + "input": 8, + "output": 15, + "cache_read": 2 }, "type": "chat" }, { - "id": "baichuan/baichuan-m2-32b", - "name": "baichuan-m2-32b", - "display_name": "baichuan-m2-32b", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "OpenAI: GPT-3.5 Turbo Instruct", + "display_name": "OpenAI: GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -44535,8 +45144,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 4095, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -44544,21 +45153,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "open_weights": false, + "release_date": "2023-03-01", + "last_updated": "2023-09-21", "cost": { - "input": 0.07, - "output": 0.07 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout Instruct", - "display_name": "Llama 4 Scout Instruct", - "modalities": { + "id": "openai/gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", + "modalities": { "input": [ "text", "image" @@ -44568,30 +45176,55 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-06", - "last_updated": "2025-04-06", + "open_weights": false, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.18, - "output": 0.59 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "openai/gpt-5.1-chat", + "name": "OpenAI: GPT-5.1 Chat", + "display_name": "OpenAI: GPT-5.1 Chat", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44599,31 +45232,33 @@ ] }, "limit": { - "context": 131072, - "output": 120000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-07", - "last_updated": "2024-12-07", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.135, - "output": 0.4 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "openai/gpt-4.1", + "name": "OpenAI: GPT-4.1", + "display_name": "OpenAI: GPT-4.1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44631,39 +45266,42 @@ ] }, "limit": { - "context": 32768, - "output": 32000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 0.03, - "output": 0.05 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "meta-llama/llama-3-8b-instruct", - "name": "Llama 3 8B Instruct", - "display_name": "Llama 3 8B Instruct", + "id": "openai/gpt-audio", + "name": "OpenAI: GPT Audio", + "display_name": "OpenAI: GPT Audio", "modalities": { "input": [ + "audio", "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": false, @@ -44671,19 +45309,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "open_weights": false, + "release_date": "2026-01-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.04, - "output": 0.04 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "openai/gpt-4o-search-preview", + "name": "OpenAI: GPT-4o Search Preview", + "display_name": "OpenAI: GPT-4o Search Preview", "modalities": { "input": [ "text" @@ -44693,28 +45331,27 @@ ] }, "limit": { - "context": 16384, + "context": 128000, "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2024-07-24", + "open_weights": false, + "release_date": "2025-03-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.02, - "output": 0.05 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "meta-llama/llama-3-70b-instruct", - "name": "Llama3 70B Instruct", - "display_name": "Llama3 70B Instruct", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: gpt-oss-20b", + "display_name": "OpenAI: gpt-oss-20b", "modalities": { "input": [ "text" @@ -44724,62 +45361,71 @@ ] }, "limit": { - "context": 8192, - "output": 8000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.51, - "output": 0.74 + "input": 0.03, + "output": 0.14 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick Instruct", - "display_name": "Llama 4 Maverick Instruct", + "id": "openai/gpt-oss-safeguard-20b", + "name": "OpenAI: gpt-oss-safeguard-20b", + "display_name": "OpenAI: gpt-oss-safeguard-20b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-04-06", - "last_updated": "2025-04-06", + "attachment": false, + "open_weights": false, + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 0.27, - "output": 0.85 + "input": 0.075, + "output": 0.3, + "cache_read": 0.037 }, "type": "chat" }, { - "id": "gryphe/mythomax-l2-13b", - "name": "Mythomax L2 13B", - "display_name": "Mythomax L2 13B", + "id": "openai/gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44787,30 +45433,48 @@ ] }, "limit": { - "context": 4096, - "output": 3200 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.09, - "output": 0.09 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "sao10k/l31-70b-euryale-v2.2", - "name": "L31 70B Euryale V2.2", - "display_name": "L31 70B Euryale V2.2", + "id": "openai/gpt-4.1-mini", + "name": "OpenAI: GPT-4.1 Mini", + "display_name": "OpenAI: GPT-4.1 Mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44818,28 +45482,29 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 1.48, - "output": 1.48 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "sao10k/l3-70b-euryale-v2.1", - "name": "L3 70B Euryale V2.1\t", - "display_name": "L3 70B Euryale V2.1\t", + "id": "openai/gpt-4-turbo-preview", + "name": "OpenAI: GPT-4 Turbo Preview", + "display_name": "OpenAI: GPT-4 Turbo Preview", "modalities": { "input": [ "text" @@ -44849,8 +45514,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -44858,30 +45523,32 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-06-18", - "last_updated": "2024-06-18", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2026-03-15", "cost": { - "input": 1.48, - "output": 1.48 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "sao10k/L3-8B-Stheno-v3.2", - "name": "L3 8B Stheno V3.2", - "display_name": "L3 8B Stheno V3.2", + "id": "openai/gpt-4o-audio-preview", + "name": "OpenAI: GPT-4o Audio", + "display_name": "OpenAI: GPT-4o Audio", "modalities": { "input": [ + "audio", "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 8192, - "output": 32000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -44889,52 +45556,58 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-29", - "last_updated": "2024-11-29", + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.05 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "sao10k/l3-8b-lunaris", - "name": "Sao10k L3 8B Lunaris\t", - "display_name": "Sao10k L3 8B Lunaris\t", + "id": "openai/gpt-5-image", + "name": "OpenAI: GPT-5 Image", + "display_name": "OpenAI: GPT-5 Image", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-28", - "last_updated": "2024-11-28", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-14", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.05 + "input": 10, + "output": 10 }, "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "Wizardlm 2 8x22B", - "display_name": "Wizardlm 2 8x22B", + "id": "openai/gpt-5.1", + "name": "OpenAI: GPT-5.1", + "display_name": "OpenAI: GPT-5.1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -44942,104 +45615,162 @@ ] }, "limit": { - "context": 65535, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-24", - "last_updated": "2024-04-24", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.62, - "output": 0.62 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: GPT OSS 20B", - "display_name": "OpenAI: GPT OSS 20B", + "id": "openai/gpt-5-nano", + "name": "OpenAI: GPT-5 Nano", + "display_name": "OpenAI: GPT-5 Nano", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.04, - "output": 0.15 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "openai/gpt-5.4", + "name": "OpenAI: GPT-5.4", + "display_name": "OpenAI: GPT-5.4", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1050000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": false, + "release_date": "2026-03-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.25 + "input": 2.5, + "output": 15 }, "type": "chat" }, { - "id": "minimaxai/minimax-m1-80k", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "openai/gpt-4-1106-preview", + "name": "OpenAI: GPT-4 Turbo (older v1106)", + "display_name": "OpenAI: GPT-4 Turbo (older v1106)", "modalities": { "input": [ "text" @@ -45049,31 +45780,32 @@ ] }, "limit": { - "context": 1000000, - "output": 40000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": false, + "release_date": "2023-11-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.55, - "output": 2.2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "xiaomimimo/mimo-v2-flash", - "name": "XiaomiMiMo/MiMo-V2-Flash", - "display_name": "XiaomiMiMo/MiMo-V2-Flash", + "id": "openai/gpt-4o-mini", + "name": "OpenAI: GPT-4o-mini", + "display_name": "OpenAI: GPT-4o-mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45081,65 +45813,77 @@ ] }, "limit": { - "context": 262144, - "output": 32000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "attachment": true, + "open_weights": false, + "release_date": "2024-07-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.3 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b-thinking", - "name": "ERNIE-4.5-VL-28B-A3B-Thinking", - "display_name": "ERNIE-4.5-VL-28B-A3B-Thinking", + "id": "openai/o1-pro", + "name": "OpenAI: o1-pro", + "display_name": "OpenAI: o1-pro", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2025-11-26", - "last_updated": "2025-11-26", + "open_weights": false, + "release_date": "2025-03-19", + "last_updated": "2026-03-15", "cost": { - "input": 0.39, - "output": 0.39 + "input": 150, + "output": 600 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "ERNIE 4.5 VL 424B A47B", - "display_name": "ERNIE 4.5 VL 424B A47B", + "id": "openai/gpt-4-turbo", + "name": "OpenAI: GPT-4 Turbo", + "display_name": "OpenAI: GPT-4 Turbo", "modalities": { "input": [ "text", @@ -45150,31 +45894,32 @@ ] }, "limit": { - "context": 123000, - "output": 16000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "open_weights": false, + "release_date": "2023-09-13", + "last_updated": "2024-04-09", "cost": { - "input": 0.42, - "output": 1.25 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21B-a3b", - "name": "ERNIE 4.5 21B A3B", - "display_name": "ERNIE 4.5 21B A3B", + "id": "openai/gpt-5.4-mini", + "name": "OpenAI: GPT-5.4 Mini", + "display_name": "OpenAI: GPT-5.4 Mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45182,31 +45927,56 @@ ] }, "limit": { - "context": 120000, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-300b-a47b-paddle", - "name": "ERNIE 4.5 300B A47B", - "display_name": "ERNIE 4.5 300B A47B", + "id": "openai/o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45214,28 +45984,44 @@ ] }, "limit": { - "context": 123000, - "output": 12000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 1.1 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21B-a3b-thinking", - "name": "ERNIE-4.5-21B-A3B-Thinking", - "display_name": "ERNIE-4.5-21B-A3B-Thinking", + "id": "openai/gpt-3.5-turbo-0613", + "name": "OpenAI: GPT-3.5 Turbo (older v0613)", + "display_name": "OpenAI: GPT-3.5 Turbo (older v0613)", "modalities": { "input": [ "text" @@ -45245,120 +46031,146 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 4095, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": false, + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 0.07, - "output": 0.28 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "ERNIE 4.5 VL 28B A3B", - "display_name": "ERNIE 4.5 VL 28B A3B", + "id": "openai/o3-mini-high", + "name": "OpenAI: o3 Mini High", + "display_name": "OpenAI: o3 Mini High", "modalities": { "input": [ - "text", - "image" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 30000, - "output": 8000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "open_weights": false, + "release_date": "2025-01-31", + "last_updated": "2026-03-15", "cost": { - "input": 1.4, - "output": 5.6 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "openai/gpt-5.1-codex-max", + "name": "OpenAI: GPT-5.1-Codex-Max", + "display_name": "OpenAI: GPT-5.1-Codex-Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "openai/gpt-5.5", + "name": "OpenAI: GPT-5.5", + "display_name": "OpenAI: GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -45367,31 +46179,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "Minimax M2.1", - "display_name": "Minimax M2.1", + "id": "openai/gpt-5.4-pro", + "name": "OpenAI: GPT-5.4 Pro", + "display_name": "OpenAI: GPT-5.4 Pro", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45399,42 +46223,52 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "openai/o4-mini-high", + "name": "OpenAI: o4 Mini High", + "display_name": "OpenAI: o4 Mini High", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45442,10 +46276,9 @@ ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 200000, + "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -45454,31 +46287,35 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-04-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "MiniMax M2.5 Highspeed", - "display_name": "MiniMax M2.5 Highspeed", + "id": "openai/o4-mini-deep-research", + "name": "OpenAI: o4 Mini Deep Research", + "display_name": "OpenAI: o4 Mini Deep Research", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45486,8 +46323,8 @@ ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 200000, + "output": 100000 }, "temperature": true, "tool_call": true, @@ -45498,31 +46335,36 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2024-06-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.03 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen2.5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "openai/gpt-4.1-nano", + "name": "OpenAI: GPT-4.1 Nano", + "display_name": "OpenAI: GPT-4.1 Nano", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45530,88 +46372,75 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.07 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5-122B-A10B", - "display_name": "Qwen3.5-122B-A10B", + "id": "openai/gpt-4", + "name": "OpenAI: GPT-4", + "display_name": "OpenAI: GPT-4", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8191, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "attachment": false, + "open_weights": false, + "release_date": "2023-03-14", + "last_updated": "2024-04-09", "cost": { - "input": 0.4, - "output": 3.2 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "qwen/qwen3.6-27b", - "name": "Qwen3.6-27B", - "display_name": "Qwen3.6-27B", + "id": "openai/o4-mini", + "name": "OpenAI: o4 Mini", + "display_name": "OpenAI: o4 Mini", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -45620,76 +46449,91 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-04-16", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3.6 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "qwen/qwen3.5-27b", - "name": "Qwen3.5-27B", - "display_name": "Qwen3.5-27B", + "id": "openai/gpt-5.1-codex", + "name": "OpenAI: GPT-5.1-Codex", + "display_name": "OpenAI: GPT-5.1-Codex", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 2.4 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "openai/gpt-4o-2024-11-20", + "name": "OpenAI: GPT-4o (2024-11-20)", + "display_name": "OpenAI: GPT-4o (2024-11-20)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -45697,7 +46541,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, @@ -45705,153 +46549,159 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "attachment": true, + "open_weights": false, + "release_date": "2024-11-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.09, - "output": 0.58 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3-omni-30b-a3b-instruct", - "name": "Qwen3 Omni 30B A3B Instruct", - "display_name": "Qwen3 Omni 30B A3B Instruct", + "id": "openai/gpt-5.2-codex", + "name": "OpenAI: GPT-5.2-Codex", + "display_name": "OpenAI: GPT-5.2-Codex", "modalities": { "input": [ "text", - "video", - "audio", "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.25, - "output": 0.97, - "input_audio": 2.2, - "output_audio": 1.788 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "openai/gpt-5-chat", + "name": "OpenAI: GPT-5 Chat", + "display_name": "OpenAI: GPT-5 Chat", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3.6 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B Instruct", - "display_name": "Qwen2.5 VL 72B Instruct", + "id": "openai/gpt-4o-mini-2024-07-18", + "name": "OpenAI: GPT-4o-mini (2024-07-18)", + "display_name": "OpenAI: GPT-4o-mini (2024-07-18)", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "open_weights": false, + "release_date": "2024-07-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.8, - "output": 0.8 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "openai/gpt-5-mini", + "name": "OpenAI: GPT-5 Mini", + "display_name": "OpenAI: GPT-5 Mini", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -45859,88 +46709,100 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.98, - "output": 3.95 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "qwen/qwen3-vl-30b-a3b-thinking", - "display_name": "qwen/qwen3-vl-30b-a3b-thinking", + "id": "openai/o3-mini", + "name": "OpenAI: o3 Mini", + "display_name": "OpenAI: o3 Mini", "modalities": { "input": [ - "text", - "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-11", - "last_updated": "2025-10-11", + "open_weights": false, + "release_date": "2024-12-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "qwen/qwen3-omni-30b-a3b-thinking", - "name": "Qwen3 Omni 30B A3B Thinking", - "display_name": "Qwen3 Omni 30B A3B Thinking", + "id": "openai/gpt-5.3-codex", + "name": "OpenAI: GPT-5.3-Codex", + "display_name": "OpenAI: GPT-5.3-Codex", "modalities": { "input": [ - "text", - "audio", - "video", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -45949,65 +46811,76 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "release_date": "2026-02-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 0.97, - "input_audio": 2.2, - "output_audio": 1.788 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-instruct", - "name": "qwen/qwen3-vl-8b-instruct", - "display_name": "qwen/qwen3-vl-8b-instruct", + "id": "openai/gpt-5.2-chat", + "name": "OpenAI: GPT-5.2 Chat", + "display_name": "OpenAI: GPT-5.2 Chat", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-17", - "last_updated": "2025-10-17", + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.08, - "output": 0.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "openai/gpt-4o-2024-08-06", + "name": "OpenAI: GPT-4o (2024-08-06)", + "display_name": "OpenAI: GPT-4o (2024-08-06)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46015,42 +46888,33 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "release_date": "2024-08-06", + "last_updated": "2026-03-15", "cost": { - "input": 2.11, - "output": 8.45 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3-32b-fp8", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "openai/gpt-chat-latest", + "name": "OpenAI: GPT Chat Latest", + "display_name": "OpenAI: GPT Chat Latest", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46058,29 +46922,35 @@ ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-05", + "last_updated": "2026-05-07", "cost": { - "input": 0.1, - "output": 0.45 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen3-4b-fp8", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "openai/gpt-oss-120b", + "name": "OpenAI: gpt-oss-120b", + "display_name": "OpenAI: gpt-oss-120b", "modalities": { "input": [ "text" @@ -46090,75 +46960,71 @@ ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.03, - "output": 0.03 + "input": 0.039, + "output": 0.19 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22b Thinking 2507", - "display_name": "Qwen3 235B A22b Thinking 2507", + "id": "openai/gpt-audio-mini", + "name": "OpenAI: GPT Audio Mini", + "display_name": "OpenAI: GPT Audio Mini", "modalities": { "input": [ + "audio", "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": false, + "release_date": "2026-01-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 3 + "input": 0.6, + "output": 2.4 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "openai/o3", + "name": "OpenAI: o3", + "display_name": "OpenAI: o3", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46166,10 +47032,10 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -46178,30 +47044,36 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-16", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 1.5 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen-mt-plus", - "name": "Qwen MT Plus", - "display_name": "Qwen MT Plus", + "id": "openai/o3-deep-research", + "name": "OpenAI: o3 Deep Research", + "display_name": "OpenAI: o3 Deep Research", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46209,30 +47081,48 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-03", - "last_updated": "2025-09-03", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-06-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 0.75 + "input": 10, + "output": 40, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "openai/gpt-5.3-chat", + "name": "OpenAI: GPT-5.3 Chat", + "display_name": "OpenAI: GPT-5.3 Chat", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46240,30 +47130,31 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 1.5 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-fp8", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "openai/gpt-5", + "name": "OpenAI: GPT-5", + "display_name": "OpenAI: GPT-5", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -46271,29 +47162,51 @@ ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.09, - "output": 0.45 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "relace/relace-apply-3", + "name": "Relace: Relace Apply 3", + "display_name": "Relace: Relace Apply 3", "modalities": { "input": [ "text" @@ -46303,28 +47216,27 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "open_weights": false, + "release_date": "2025-09-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.85, + "output": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "relace/relace-search", + "name": "Relace: Relace Search", + "display_name": "Relace: Relace Search", "modalities": { "input": [ "text" @@ -46334,8 +47246,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -46343,25 +47255,22 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2025-12-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.3 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "qwen/qwen3-vl-30b-a3b-instruct", - "display_name": "qwen/qwen3-vl-30b-a3b-instruct", + "id": "aion-labs/aion-1.0", + "name": "AionLabs: Aion-1.0", + "display_name": "AionLabs: Aion-1.0", "modalities": { "input": [ - "text", - "video", - "image" + "text" ], "output": [ "text" @@ -46372,24 +47281,25 @@ "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-11", - "last_updated": "2025-10-11", + "attachment": false, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 0.7 + "input": 4, + "output": 8 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30b A3B Instruct", - "display_name": "Qwen3 Coder 30b A3B Instruct", + "id": "aion-labs/aion-rp-llama-3.1-8b", + "name": "AionLabs: Aion-RP 1.0 (8B)", + "display_name": "AionLabs: Aion-RP 1.0 (8B)", "modalities": { "input": [ "text" @@ -46399,28 +47309,28 @@ ] }, "limit": { - "context": 160000, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-09", - "last_updated": "2025-10-09", + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.27 + "input": 0.8, + "output": 1.6 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-fp8", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "aion-labs/aion-2.0", + "name": "AionLabs: Aion-2.0", + "display_name": "AionLabs: Aion-2.0", "modalities": { "input": [ "text" @@ -46430,8 +47340,8 @@ ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -46440,19 +47350,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + "release_date": "2026-02-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.8, + "output": 1.6 }, "type": "chat" }, { - "id": "qwen/qwen3-8b-fp8", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "aion-labs/aion-1.0-mini", + "name": "AionLabs: Aion-1.0-Mini", + "display_name": "AionLabs: Aion-1.0-Mini", "modalities": { "input": [ "text" @@ -46462,8 +47372,8 @@ ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -46472,54 +47382,53 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.035, - "output": 0.138 + "input": 0.7, + "output": 1.4 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "openrouter/pareto-code", + "name": "Pareto Code Router", + "display_name": "Pareto Code Router", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen 2.5 72B Instruct", - "display_name": "Qwen 2.5 72B Instruct", + "id": "openrouter/free", + "name": "Free Models Router", + "display_name": "Free Models Router", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -46527,42 +47436,40 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-10-15", - "last_updated": "2024-10-15", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.38, - "output": 0.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen3.5-35B-A3B", - "display_name": "Qwen3.5-35B-A3B", + "id": "openrouter/owl-alpha", + "name": "Owl Alpha", + "display_name": "Owl Alpha", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1048756, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -46570,31 +47477,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-28", + "last_updated": "2026-04-30", "cost": { - "input": 0.25, - "output": 2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro", - "name": "Kat Coder Pro", - "display_name": "Kat Coder Pro", + "id": "openrouter/bodybuilder", + "name": "Body Builder (beta)", + "display_name": "Body Builder (beta)", "modalities": { "input": [ "text" @@ -46604,41 +47500,43 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-05", - "last_updated": "2026-01-05", + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "openrouter/auto", + "name": "Auto Router", + "display_name": "Auto Router", "modalities": { "input": [ + "audio", + "image", + "pdf", "text", - "image" + "video" ], "output": [ + "image", "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 2000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -46647,23 +47545,22 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Gemma 3 12B", - "display_name": "Gemma 3 12B", + "id": "switchpoint/router", + "name": "Switchpoint Router", + "display_name": "Switchpoint Router", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -46671,28 +47568,59 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-12", + "last_updated": "2026-03-15", + "cost": { + "input": 0.85, + "output": 3.4 + }, + "type": "chat" + }, + { + "id": "mancer/weaver", + "name": "Mancer: Weaver (alpha)", + "display_name": "Mancer: Weaver (alpha)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "attachment": false, + "open_weights": false, + "release_date": "2023-08-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.1 + "input": 0.75, + "output": 1 }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "amazon/nova-pro-v1", + "name": "Amazon: Nova Pro 1.0", + "display_name": "Amazon: Nova Pro 1.0", "modalities": { "input": [ "text", @@ -46703,40 +47631,42 @@ ] }, "limit": { - "context": 98304, - "output": 16384 + "context": 300000, + "output": 5120 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.119, - "output": 0.2 + "input": 0.8, + "output": 3.2 }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B", - "display_name": "Gemma 4 26B A4B", + "id": "amazon/nova-2-lite-v1", + "name": "Amazon: Nova 2 Lite", + "display_name": "Amazon: Nova 2 Lite", "modalities": { "input": [ + "image", + "pdf", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1000000, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -46745,66 +47675,83 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.13, - "output": 0.4 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "amazon/nova-lite-v1", + "name": "Amazon: Nova Lite 1.0", + "display_name": "Amazon: Nova Lite 1.0", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 300000, + "output": 5120 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.06, + "output": 0.24 + }, + "type": "chat" + }, + { + "id": "amazon/nova-premier-v1", + "name": "Amazon: Nova Premier 1.0", + "display_name": "Amazon: Nova Premier 1.0", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "release_date": "2025-11-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 2.5, + "output": 12.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "amazon/nova-micro-v1", + "name": "Amazon: Nova Micro 1.0", + "display_name": "Amazon: Nova Micro 1.0", "modalities": { "input": [ "text" @@ -46814,8 +47761,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 5120 }, "temperature": true, "tool_call": true, @@ -46823,19 +47770,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.57, - "output": 2.3 + "input": 0.035, + "output": 0.14 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "writer/palmyra-x5", + "name": "Writer: Palmyra X5", + "display_name": "Writer: Palmyra X5", "modalities": { "input": [ "text" @@ -46845,76 +47792,59 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1040000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { "input": 0.6, - "output": 2.5 + "output": 6 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "inflection/inflection-3-productivity", + "name": "Inflection: Inflection 3 Productivity", + "display_name": "Inflection: Inflection 3 Productivity", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8000, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "inflection/inflection-3-pi", + "name": "Inflection: Inflection 3 Pi", + "display_name": "Inflection: Inflection 3 Pi", "modalities": { "input": [ "text" @@ -46924,40 +47854,28 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8000, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.5 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "minimax/minimax-m2.1", + "name": "MiniMax: MiniMax M2.1", + "display_name": "MiniMax: MiniMax M2.1", "modalities": { "input": [ "text" @@ -46967,8 +47885,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 196608, + "output": 39322 }, "temperature": true, "tool_call": true, @@ -46978,31 +47896,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.27, + "output": 0.95, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "minimax/minimax-m2", + "name": "MiniMax: MiniMax M2", + "display_name": "MiniMax: MiniMax M2", "modalities": { "input": [ "text" @@ -47012,8 +47923,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -47023,70 +47934,56 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-10-23", + "last_updated": "2026-03-15", "cost": { - "input": 1.69, - "output": 3.38, - "cache_read": 0.13 + "input": 0.255, + "output": 1, + "cache_read": 0.03 }, "type": "chat" - } - ] - }, - "xiaomi-token-plan-cn": { - "id": "xiaomi-token-plan-cn", - "name": "Xiaomi Token Plan (China)", - "display_name": "Xiaomi Token Plan (China)", - "api": "https://token-plan-cn.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ + }, { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", + "id": "minimax/minimax-m1", + "name": "MiniMax: MiniMax M1", + "display_name": "MiniMax: MiniMax M1", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 1000000, + "output": 40000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2.2 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "minimax/minimax-m2.5", + "name": "MiniMax: MiniMax M2.5", + "display_name": "MiniMax: MiniMax M2.5", "modalities": { "input": [ "text" @@ -47096,8 +47993,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -47107,98 +48004,65 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-02-12", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 0.25, + "output": 1.2, + "cache_read": 0.029 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "minimax/minimax-m2-her", + "name": "MiniMax: MiniMax M2-her", + "display_name": "MiniMax: MiniMax M2-her", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 65536, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-23", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "minimax/minimax-m2.7", + "name": "MiniMax: MiniMax M2.7", + "display_name": "MiniMax: MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 204800, "output": 131072 }, "temperature": true, @@ -47218,79 +48082,57 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "minimax/minimax-01", + "name": "MiniMax: MiniMax-01", + "display_name": "MiniMax: MiniMax-01", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1000192, + "output": 1000192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": true, + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "x-ai/grok-4.20", + "name": "xAI: Grok 4.20", + "display_name": "xAI: Grok 4.20", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -47298,8 +48140,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -47307,42 +48149,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-31", + "last_updated": "2026-04-11", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 2, + "output": 6, + "cache_read": 0.2 }, "type": "chat" - } - ] - }, - "wandb": { - "id": "wandb", - "name": "Weights & Biases", - "display_name": "Weights & Biases", - "api": "https://api.inference.wandb.ai/v1", - "doc": "https://docs.wandb.ai/guides/integrations/inference/", - "models": [ + }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "x-ai/grok-code-fast-1:optimized:free", + "name": "xAI: Grok Code Fast 1 Optimized (experimental, free)", + "display_name": "xAI: Grok Code Fast 1 Optimized (experimental, free)", "modalities": { "input": [ "text" @@ -47352,30 +48173,33 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-08-27", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "x-ai/grok-4.20-multi-agent", + "name": "xAI: Grok 4.20 Multi-Agent", + "display_name": "xAI: Grok 4.20 Multi-Agent", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -47383,40 +48207,43 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-31", + "last_updated": "2026-04-11", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2, + "output": 6, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "x-ai/grok-4.3", + "name": "xAI: Grok 4.3", + "display_name": "xAI: Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -47426,30 +48253,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen3-Coder-480B-A35B-Instruct", + "id": "kwaipilot/kat-coder-pro-v2", + "name": "Kwaipilot: KAT-Coder-Pro V2", + "display_name": "Kwaipilot: KAT-Coder-Pro V2", "modalities": { "input": [ "text" @@ -47459,8 +48280,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 80000 }, "temperature": true, "tool_call": true, @@ -47469,19 +48290,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2026-03-12", + "release_date": "2026-03-27", + "last_updated": "2026-04-11", "cost": { - "input": 1, - "output": 1.5 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "zai-org/GLM-5-FP8", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "nousresearch/hermes-4-405b", + "name": "Nous: Hermes 4 405B", + "display_name": "Nous: Hermes 4 405B", "modalities": { "input": [ "text" @@ -47491,62 +48312,60 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-03-12", + "release_date": "2025-08-25", + "last_updated": "2025-08-25", "cost": { "input": 1, - "output": 3.2 + "output": 3 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "nousresearch/hermes-3-llama-3.1-405b", + "name": "Nous: Hermes 3 405B Instruct", + "display_name": "Nous: Hermes 3 405B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2026-03-12", + "release_date": "2024-08-16", + "last_updated": "2024-08-16", "cost": { - "input": 0.17, - "output": 0.66 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "nousresearch/hermes-4-70b", + "name": "Nous: Hermes 4 70B", + "display_name": "Nous: Hermes 4 70B", "modalities": { "input": [ "text" @@ -47556,30 +48375,30 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2026-03-12", + "release_date": "2025-08-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.13, + "output": 0.4, + "cache_read": 0.055 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "nousresearch/hermes-3-llama-3.1-70b", + "name": "Nous: Hermes 3 70B Instruct", + "display_name": "Nous: Hermes 3 70B Instruct", "modalities": { "input": [ "text" @@ -47589,30 +48408,28 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2026-03-12", + "release_date": "2024-08-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.22, - "output": 0.22 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama 3.1 70B", - "display_name": "Llama 3.1 70B", + "id": "nousresearch/hermes-2-pro-llama-3-8b", + "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", + "display_name": "NousResearch: Hermes 2 Pro - Llama-3 8B", "modalities": { "input": [ "text" @@ -47622,28 +48439,28 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2026-03-12", + "release_date": "2024-05-27", + "last_updated": "2024-06-27", "cost": { - "input": 0.8, - "output": 0.8 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "OpenPipe/Qwen3-14B-Instruct", - "name": "OpenPipe Qwen3 14B Instruct", - "display_name": "OpenPipe Qwen3 14B Instruct", + "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", + "name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "display_name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", "modalities": { "input": [ "text" @@ -47653,28 +48470,29 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { - "input": 0.05, - "output": 0.22 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "microsoft/Phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "nvidia/nemotron-3-super-120b-a12b:free", + "name": "NVIDIA: Nemotron 3 Super (free)", + "display_name": "NVIDIA: Nemotron 3 Super (free)", "modalities": { "input": [ "text" @@ -47684,8 +48502,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -47695,19 +48513,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2026-03-12", + "release_date": "2026-03-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.08, - "output": 0.35 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-FP8", - "name": "NVIDIA Nemotron 3 Super 120B", - "display_name": "NVIDIA Nemotron 3 Super 120B", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "NVIDIA: Nemotron 3 Super", + "display_name": "NVIDIA: Nemotron 3 Super", "modalities": { "input": [ "text" @@ -47723,22 +48540,24 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, "release_date": "2026-03-11", - "last_updated": "2026-03-12", + "last_updated": "2026-04-11", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.1, + "output": 0.5, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "nvidia/nemotron-nano-9b-v2", + "name": "NVIDIA: Nemotron Nano 9B V2", + "display_name": "NVIDIA: Nemotron Nano 9B V2", "modalities": { "input": [ "text" @@ -47748,64 +48567,64 @@ ] }, "limit": { - "context": 161000, - "output": 161000 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2026-03-12", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 0.55, - "output": 1.65 + "input": 0.04, + "output": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", + "name": "NVIDIA: Nemotron 3 Nano Omni (free)", + "display_name": "NVIDIA: Nemotron 3 Nano Omni (free)", "modalities": { "input": [ - "text" + "text", + "audio", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-12", + "release_date": "2026-04-28", + "last_updated": "2026-05-01", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B", "modalities": { "input": [ "text" @@ -47815,79 +48634,92 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-12", + "open_weights": true, + "release_date": "2024-12", + "last_updated": "2026-02-04", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "anthropic/claude-sonnet-4.6", + "name": "Anthropic: Claude Sonnet 4.6", + "display_name": "Anthropic: Claude Sonnet 4.6", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-12", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.5, - "output": 2.85 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "anthropic/claude-opus-4.6-fast", + "name": "Anthropic: Claude Opus 4.6 (Fast)", + "display_name": "Anthropic: Claude Opus 4.6 (Fast)", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -47895,36 +48727,62 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true - } + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-04-07", + "last_updated": "2026-04-11", "cost": { - "input": 0.3, - "output": 1.2 + "input": 30, + "output": 150, + "cache_read": 3, + "cache_write": 37.5 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "anthropic/claude-3-haiku", + "name": "Anthropic: Claude 3 Haiku", + "display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -47932,52 +48790,33 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" - } - ] - }, - "chutes": { - "id": "chutes", - "name": "Chutes", - "display_name": "Chutes", - "api": "https://llm.chutes.ai/v1", - "doc": "https://llm.chutes.ai/v1/models", - "models": [ + }, { - "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", - "name": "DeepHermes 3 Mistral 24B Preview", - "display_name": "DeepHermes 3 Mistral 24B Preview", + "id": "anthropic/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -47985,31 +48824,35 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2026-03-15", "cost": { - "input": 0.0245, - "output": 0.0978, - "cache_read": 0.01225 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "NousResearch/Hermes-4-14B", - "name": "Hermes 4 14B", - "display_name": "Hermes 4 14B", + "id": "anthropic/claude-opus-4.7-fast", + "name": "Anthropic: Claude Opus 4.7 (Fast)", + "display_name": "Anthropic: Claude Opus 4.7 (Fast)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -48017,87 +48860,121 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-12", + "last_updated": "2026-05-16", "cost": { - "input": 0.0136, - "output": 0.0543, - "cache_read": 0.0068 + "input": 30, + "output": 150, + "cache_read": 3, + "cache_write": 37.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "anthropic/claude-opus-4.6", + "name": "Anthropic: Claude Opus 4.6", + "display_name": "Anthropic: Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.06, - "output": 0.22, - "cache_read": 0.03 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B-TEE", - "name": "Qwen3 32B TEE", - "display_name": "Qwen3 32B TEE", + "id": "anthropic/claude-opus-4.1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -48105,8 +48982,8 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -48114,33 +48991,35 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.04 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-27B-TEE", - "name": "Qwen3.6 27B TEE", - "display_name": "Qwen3.6 27B TEE", + "id": "anthropic/claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -48148,34 +49027,25 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.195, - "output": 1.56, - "cache_read": 0.0975 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "anthropic/claude-haiku-4.5", + "name": "Anthropic: Claude Haiku 4.5", + "display_name": "Anthropic: Claude Haiku 4.5", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -48183,31 +49053,35 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3Guard-Gen-0.6B", - "name": "Qwen3Guard Gen 0.6B", - "display_name": "Qwen3Guard Gen 0.6B", + "id": "anthropic/claude-opus-4.5", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -48215,31 +49089,35 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "anthropic/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -48247,93 +49125,125 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0.8, - "cache_read": 0.05 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", - "name": "Qwen3 235B A22B Instruct 2507 TEE", - "display_name": "Qwen3 235B A22B Instruct 2507 TEE", + "id": "anthropic/claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.1, - "output": 0.6, - "cache_read": 0.05 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next-TEE", - "name": "Qwen3 Coder Next TEE", - "display_name": "Qwen3 Coder Next TEE", + "id": "anthropic/claude-opus-4.7", + "name": "Anthropic: Claude Opus 4.7", + "display_name": "Anthropic: Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-16", + "last_updated": "2026-05-01", "cost": { - "input": 0.12, - "output": 0.75, - "cache_read": 0.06 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "inclusionai/ring-2.6-1t", + "name": "inclusionAI: Ring-2.6-1T", + "display_name": "inclusionAI: Ring-2.6-1T", "modalities": { "input": [ "text" @@ -48344,7 +49254,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -48352,69 +49262,56 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2026-05-08", + "last_updated": "2026-05-16", "cost": { - "input": 0.11, - "output": 0.6, - "cache_read": 0.055 + "input": 0.075, + "output": 0.625, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "inclusionai/ling-2.6-1t", + "name": "inclusionAI: Ling-2.6-1T", + "display_name": "inclusionAI: Ling-2.6-1T", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-23", + "last_updated": "2026-05-16", "cost": { - "input": 0.0543, - "output": 0.2174, - "cache_read": 0.02715 + "input": 0.3, + "output": 2.5, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B-TEE", - "name": "Qwen3.5 397B A17B TEE", - "display_name": "Qwen3.5 397B A17B TEE", + "id": "inclusionai/ling-2.6-flash", + "name": "inclusionAI: Ling-2.6 Flash", + "display_name": "inclusionAI: Ling-2.6 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -48422,72 +49319,60 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-18", - "last_updated": "2026-04-25", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 0.39, - "output": 2.34, - "cache_read": 0.195 + "input": 0.08, + "output": 0.24, + "cache_read": 0.016 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "mistralai/mistral-large-2512", + "name": "Mistral: Mistral Large 3 2512", + "display_name": "Mistral: Mistral Large 3 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2024-11-01", + "last_updated": "2025-12-16", "cost": { - "input": 0.2989, - "output": 1.1957, - "cache_read": 0.14945 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1-TEE", - "name": "GLM 5.1 TEE", - "display_name": "GLM 5.1 TEE", + "id": "mistralai/mistral-7b-instruct-v0.1", + "name": "Mistral: Mistral 7B Instruct v0.1", + "display_name": "Mistral: Mistral 7B Instruct v0.1", "modalities": { "input": [ "text" @@ -48497,41 +49382,28 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 2824, + "output": 565 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", "cost": { - "input": 1.05, - "output": 3.5, - "cache_read": 0.525 + "input": 0.11, + "output": 0.19 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-FP8", - "name": "GLM 4.7 FP8", - "display_name": "GLM 4.7 FP8", + "id": "mistralai/mistral-large-2411", + "name": "Mistral Large 2411", + "display_name": "Mistral Large 2411", "modalities": { "input": [ "text" @@ -48541,30 +49413,28 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-04-25", + "release_date": "2024-07-24", + "last_updated": "2024-11-04", "cost": { - "input": 0.2989, - "output": 1.1957, - "cache_read": 0.14945 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "zai-org/GLM-5-TEE", - "name": "GLM 5 TEE", - "display_name": "GLM 5 TEE", + "id": "mistralai/mistral-saba", + "name": "Mistral: Saba", + "display_name": "Mistral: Saba", "modalities": { "input": [ "text" @@ -48574,41 +49444,28 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-14", - "last_updated": "2026-04-25", + "release_date": "2025-02-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.95, - "output": 2.55, - "cache_read": 0.475 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-TEE", - "name": "GLM 4.7 TEE", - "display_name": "GLM 4.7 TEE", + "id": "mistralai/codestral-2508", + "name": "Mistral: Codestral 2508", + "display_name": "Mistral: Codestral 2508", "modalities": { "input": [ "text" @@ -48618,45 +49475,32 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 256000, + "output": 51200 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.39, - "output": 1.75, - "cache_read": 0.195 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "GLM 4.6V", - "display_name": "GLM 4.6V", + "id": "mistralai/mistral-small-3.2-24b-instruct", + "name": "Mistral: Mistral Small 3.2 24B", + "display_name": "Mistral: Mistral Small 3.2 24B", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" @@ -48664,42 +49508,31 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.15 + "input": 0.06, + "output": 0.18, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "zai-org/GLM-5-Turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "mistralai/mistral-small-2603", + "name": "Mistral: Mistral Small 4", + "display_name": "Mistral: Mistral Small 4", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -48707,8 +49540,8 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -48716,32 +49549,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-04-25", + "release_date": "2026-03-16", + "last_updated": "2026-04-11", "cost": { - "input": 0.4891, - "output": 1.9565, - "cache_read": 0.24455 + "input": 0.15, + "output": 0.6, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "XiaomiMiMo/MiMo-V2-Flash-TEE", - "name": "MiMo V2 Flash TEE", - "display_name": "MiMo V2 Flash TEE", + "id": "mistralai/mistral-nemo", + "name": "Mistral: Mistral Nemo", + "display_name": "Mistral: Mistral Nemo", "modalities": { "input": [ "text" @@ -48751,8 +49573,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -48761,19 +49583,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "release_date": "2024-07-01", + "last_updated": "2024-07-30", "cost": { - "input": 0.09, - "output": 0.29, - "cache_read": 0.045 + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "mistralai/devstral-2512", + "name": "Mistral: Devstral 2 2512", + "display_name": "Mistral: Devstral 2 2512", "modalities": { "input": [ "text" @@ -48783,43 +49604,32 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-09-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 + "input": 0.4, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-TEE", - "name": "DeepSeek V3.1 TEE", - "display_name": "DeepSeek V3.1 TEE", + "id": "mistralai/mistral-medium-3-5", + "name": "Mistral: Mistral Medium 3.5", + "display_name": "Mistral: Mistral Medium 3.5", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -48827,8 +49637,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -48836,64 +49646,52 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-30", + "last_updated": "2026-05-07", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-0324-TEE", - "name": "DeepSeek V3 0324 TEE", - "display_name": "DeepSeek V3 0324 TEE", + "id": "mistralai/ministral-14b-2512", + "name": "Mistral: Ministral 3 14B 2512", + "display_name": "Mistral: Ministral 3 14B 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.25, - "output": 1, - "cache_read": 0.125 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528-TEE", - "name": "DeepSeek R1 0528 TEE", - "display_name": "DeepSeek R1 0528 TEE", + "id": "mistralai/mixtral-8x22b-instruct", + "name": "Mistral: Mixtral 8x22B Instruct", + "display_name": "Mistral: Mixtral 8x22B Instruct", "modalities": { "input": [ "text" @@ -48903,85 +49701,60 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 65536, + "output": 13108 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0.45, - "output": 2.15, - "cache_read": 0.225 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-TEE", - "name": "DeepSeek V3.2 TEE", - "display_name": "DeepSeek V3.2 TEE", + "id": "mistralai/voxtral-small-24b-2507", + "name": "Mistral: Voxtral Small 24B 2507", + "display_name": "Mistral: Voxtral Small 24B 2507", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 32000, + "output": 6400 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.14 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b-TEE", - "name": "gpt oss 120b TEE", - "display_name": "gpt oss 120b TEE", + "id": "mistralai/devstral-medium", + "name": "Mistral: Devstral Medium", + "display_name": "Mistral: Devstral Medium", "modalities": { "input": [ "text" @@ -48992,44 +49765,31 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.09, - "output": 0.36, - "cache_read": 0.045 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "unsloth/gemma-3-12b-it", - "name": "gemma 3 12b it", - "display_name": "gemma 3 12b it", + "id": "mistralai/pixtral-large-2411", + "name": "Mistral: Pixtral Large 2411", + "display_name": "Mistral: Pixtral Large 2411", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" @@ -49037,28 +49797,27 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2024-11-19", + "last_updated": "2026-03-15", "cost": { - "input": 0.03, - "output": 0.1, - "cache_read": 0.015 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "unsloth/Llama-3.2-3B-Instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "mistralai/mistral-large-2407", + "name": "Mistral Large 2407", + "display_name": "Mistral Large 2407", "modalities": { "input": [ "text" @@ -49068,29 +49827,91 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-02-12", - "last_updated": "2026-04-25", + "release_date": "2024-11-19", + "last_updated": "2026-03-15", "cost": { - "input": 0.01, - "output": 0.0136, - "cache_read": 0.005 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "unsloth/gemma-3-4b-it", - "name": "gemma 3 4b it", - "display_name": "gemma 3 4b it", + "id": "mistralai/mistral-large", + "name": "Mistral Large", + "display_name": "Mistral Large", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 25600 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-24", + "last_updated": "2025-12-02", + "cost": { + "input": 2, + "output": 6 + }, + "type": "chat" + }, + { + "id": "mistralai/ministral-3b-2512", + "name": "Mistral: Ministral 3 3B 2512", + "display_name": "Mistral: Ministral 3 3B 2512", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2026-03-15", + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "chat" + }, + { + "id": "mistralai/mistral-medium-3", + "name": "Mistral: Mistral Medium 3", + "display_name": "Mistral: Mistral Medium 3", "modalities": { "input": [ "text", @@ -49101,29 +49922,28 @@ ] }, "limit": { - "context": 96000, - "output": 96000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.01, - "output": 0.0272, - "cache_read": 0.005 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "unsloth/Llama-3.2-1B-Instruct", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "mistralai/mistral-small-24b-instruct-2501", + "name": "Mistral: Mistral Small 3", + "display_name": "Mistral: Mistral Small 3", "modalities": { "input": [ "text" @@ -49133,29 +49953,28 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 32768, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-04-25", + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 + "input": 0.05, + "output": 0.08 }, "type": "chat" }, { - "id": "unsloth/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "mistralai/devstral-small", + "name": "Mistral: Devstral Small 1.1", + "display_name": "Mistral: Devstral Small 1.1", "modalities": { "input": [ "text" @@ -49166,40 +49985,39 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 26215 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-05-07", + "last_updated": "2025-07-10", "cost": { - "input": 0.02, - "output": 0.04, - "cache_read": 0.01 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "unsloth/gemma-3-27b-it", - "name": "gemma 3 27b it", - "display_name": "gemma 3 27b it", + "id": "mistralai/ministral-8b-2512", + "name": "Mistral: Ministral 3 8B 2512", + "display_name": "Mistral: Ministral 3 8B 2512", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49208,19 +50026,18 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-12-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "google/gemma-4-31B-turbo-TEE", - "name": "gemma 4 31B turbo TEE", - "display_name": "gemma 4 31B turbo TEE", + "id": "mistralai/mistral-medium-3.1", + "name": "Mistral: Mistral Medium 3.1", + "display_name": "Mistral: Mistral Medium 3.1", "modalities": { "input": [ "text", @@ -49232,89 +50049,72 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.13, - "output": 0.38, - "cache_read": 0.065 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6-TEE", - "name": "Kimi K2.6 TEE", - "display_name": "Kimi K2.6 TEE", + "id": "mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral: Mistral Small 3.1 24B", + "display_name": "Mistral: Mistral Small 3.1 24B", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 128000, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-04-20", - "last_updated": "2026-04-25", + "release_date": "2025-03-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.475 + "input": 0.35, + "output": 0.56, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5-TEE", - "name": "Kimi K2.5 TEE", - "display_name": "Kimi K2.5 TEE", + "id": "qwen/qwen3-vl-8b-thinking", + "name": "Qwen: Qwen3 VL 8B Thinking", + "display_name": "Qwen: Qwen3 VL 8B Thinking", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49334,21 +50134,19 @@ } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-04-25", + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.44, - "output": 2, - "cache_read": 0.22 + "input": 0.117, + "output": 1.365 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5-TEE", - "name": "MiniMax M2.5 TEE", - "display_name": "MiniMax M2.5 TEE", + "id": "qwen/qwen3-30b-a3b-instruct-2507", + "name": "Qwen: Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -49358,7 +50156,41 @@ ] }, "limit": { - "context": 196608, + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2026-03-15", + "cost": { + "input": 0.09, + "output": 0.3, + "cache_read": 0.04 + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-plus-20260420", + "name": "Qwen: Qwen3.5 Plus 2026-04-20", + "display_name": "Qwen: Qwen3.5 Plus 2026-04-20", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, "output": 65536 }, "temperature": true, @@ -49378,21 +50210,20 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.15, - "output": 1.2, - "cache_read": 0.075 + "input": 0.4, + "output": 2.4 }, "type": "chat" }, { - "id": "rednote-hilab/dots.ocr", - "name": "dots.ocr", - "display_name": "dots.ocr", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen: Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ "text", @@ -49403,40 +50234,42 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 52429 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2025-09-23", + "last_updated": "2026-01-10", "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 + "input": 0.2, + "output": 0.88, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "tngtech/DeepSeek-TNG-R1T2-Chimera-TEE", - "name": "DeepSeek TNG R1T2 Chimera TEE", - "display_name": "DeepSeek TNG R1T2 Chimera TEE", + "id": "qwen/qwen3.6-27b", + "name": "Qwen: Qwen3.6 27B", + "display_name": "Qwen: Qwen3.6 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -49444,32 +50277,34 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.3, - "output": 1.1, - "cache_read": 0.15 + "input": 0.325, + "output": 3.25 }, "type": "chat" - } - ] - }, - "dinference": { - "id": "dinference", - "name": "DInference", - "display_name": "DInference", - "api": "https://api.dinference.com/v1", - "doc": "https://dinference.com", - "models": [ + }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen: Qwen2.5 VL 72B Instruct", + "display_name": "Qwen: Qwen2.5 VL 72B Instruct", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -49477,44 +50312,42 @@ ] }, "limit": { - "context": 131072, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08", - "last_updated": "2025-08", + "release_date": "2025-02-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.0675, - "output": 0.27 + "input": 0.8, + "output": 0.8, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen/qwen3.5-plus-02-15", + "name": "Qwen: Qwen3.5 Plus 2026-02-15", + "display_name": "Qwen: Qwen3.5 Plus 2026-02-15", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -49533,23 +50366,23 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.45, - "output": 1.65 + "input": 0.26, + "output": 1.56 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen: Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -49557,8 +50390,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49577,20 +50410,20 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-09-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.75, - "output": 2.4 + "input": 0.26, + "output": 2.6 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "qwen/qwen3-8b", + "name": "Qwen: Qwen3 8B", + "display_name": "Qwen: Qwen3 8B", "modalities": { "input": [ "text" @@ -49600,8 +50433,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 40960, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -49621,19 +50454,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 3.89 + "input": 0.05, + "output": 0.4, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -49643,114 +50477,84 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2024-09", + "last_updated": "2026-01-10", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0.12, + "output": 0.39 }, "type": "chat" - } - ] - }, - "vivgrid": { - "id": "vivgrid", - "name": "Vivgrid", - "display_name": "Vivgrid", - "api": "https://api.vivgrid.com/v1", - "doc": "https://docs.vivgrid.com/models", - "models": [ + }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen: Qwen3.5-122B-A10B", + "display_name": "Qwen: Qwen3.5-122B-A10B", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": true, + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.26, + "output": 2.08 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "qwen/qwen-plus-2025-07-28:thinking", + "name": "Qwen: Qwen Plus 0728 (thinking)", + "display_name": "Qwen: Qwen Plus 0728 (thinking)", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49758,43 +50562,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.26, + "output": 0.78 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "qwen/qwen3-max-thinking", + "name": "Qwen: Qwen3 Max Thinking", + "display_name": "Qwen: Qwen3 Max Thinking", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -49805,383 +50597,269 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2026-01-23", + "last_updated": "2026-03-15", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.78, + "output": 3.9 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "qwen/qwen3-max", + "name": "Qwen: Qwen3 Max", + "display_name": "Qwen: Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-09-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 1.2, + "output": 6, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "qwen/qwen3-235b-a22b-2507", + "name": "Qwen: Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 52429 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-01", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.071, + "output": 0.1 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "qwen/qwen3-235b-a22b", + "name": "Qwen: Qwen3 235B A22B", + "display_name": "Qwen: Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.455, + "output": 1.82, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen: Qwen3.5 397B A17B", + "display_name": "Qwen: Qwen3.5 397B A17B", "modalities": { "input": [ - "text", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-02-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.39, + "output": 2.34 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "qwen/qwen-2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "open_weights": true, + "release_date": "2024-11-11", + "last_updated": "2026-03-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.2, + "output": 0.2, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "qwen/qwen3.5-9b", + "name": "Qwen: Qwen3.5-9B", + "display_name": "Qwen: Qwen3.5-9B", "modalities": { "input": [ - "text", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "release_date": "2026-03-10", + "last_updated": "2026-03-15", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.05, + "output": 0.15 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "qwen/qwen3-coder-next", + "name": "Qwen: Qwen3 Coder Next", + "display_name": "Qwen: Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -50191,106 +50869,75 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-02-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 0.42 + "input": 0.12, + "output": 0.75, + "cache_read": 0.035 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "qwen/qwen3-coder", + "name": "Qwen: Qwen3 Coder 480B A35B", + "display_name": "Qwen: Qwen3 Coder 480B A35B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 52429 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.22, + "output": 1, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "qwen/qwen3.6-plus", + "name": "Qwen: Qwen3.6 Plus", + "display_name": "Qwen: Qwen3.6 Plus", "modalities": { "input": [ - "text", "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -50299,45 +50946,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2025-08-26", + "last_updated": "2026-04-11", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.325, + "output": 1.95, + "cache_read": 0.0325, + "cache_write": 0.40625 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "qwen/qwen3-coder-flash", + "name": "Qwen: Qwen3 Coder Flash", + "display_name": "Qwen: Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -50348,62 +50980,39 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2026-03-15", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.195, + "output": 0.975, + "cache_read": 0.06 }, "type": "chat" - } - ] - }, - "deepinfra": { - "id": "deepinfra", - "name": "Deep Infra", - "display_name": "Deep Infra", - "doc": "https://deepinfra.com/models", - "models": [ + }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen 3.5 397B A17B", - "display_name": "Qwen 3.5 397B A17B", + "id": "qwen/qwen3-30b-a3b-thinking-2507", + "name": "Qwen: Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 32768, + "output": 6554 }, "temperature": true, "tool_call": true, @@ -50422,34 +51031,31 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-01", - "last_updated": "2026-04-20", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.54, - "output": 3.4 + "input": 0.051, + "output": 0.34 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-35B-A3B", - "name": "Qwen 3.5 35B A3B", - "display_name": "Qwen 3.5 35B A3B", + "id": "qwen/qwen3-32b", + "name": "Qwen: Qwen3 32B", + "display_name": "Qwen: Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -50468,53 +51074,21 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-01", - "last_updated": "2026-04-20", - "cost": { - "input": 0.2, - "output": 0.95 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", - "name": "Qwen3 Coder 480B A35B Instruct Turbo", - "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 66536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2024-12-01", + "last_updated": "2026-02-04", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.08, + "output": 0.24, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen: Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -50524,33 +51098,44 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-09-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.0975, + "output": 0.78 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "qwen/qwen3.5-flash-02-23", + "name": "Qwen: Qwen3.5-Flash", + "display_name": "Qwen: Qwen3.5-Flash", "modalities": { "input": [ - "text", "image", + "text", "video" ], "output": [ @@ -50558,8 +51143,8 @@ ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50580,18 +51165,18 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-Flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "qwen/qwen3-30b-a3b", + "name": "Qwen: Qwen3 30B A3B", + "display_name": "Qwen: Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -50601,8 +51186,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -50623,21 +51208,22 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.06, - "output": 0.4 + "input": 0.08, + "output": 0.28, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "Qwen: Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -50646,39 +51232,52 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.13, + "output": 1.56 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen: Qwen3.5-35B-A3B", + "display_name": "Qwen: Qwen3.5-35B-A3B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50697,36 +51296,36 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.43, - "output": 1.75, - "cache_read": 0.08 + "input": 0.1625, + "output": 1.3 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "qwen/qwen3.6-35b-a3b", + "name": "Qwen: Qwen3.6 35B A3B", + "display_name": "Qwen: Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -50742,22 +51341,21 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.1612, + "output": 0.96525, + "cache_read": 0.1612 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen/qwen-plus-2025-07-28", + "name": "Qwen: Qwen Plus 0728", + "display_name": "Qwen: Qwen Plus 0728", "modalities": { "input": [ "text" @@ -50767,14 +51365,13 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -50789,32 +51386,61 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-09-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.8, - "output": 2.56, - "cache_read": 0.16 + "input": 0.26, + "output": 0.78 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "Qwen: Qwen3 VL 8B Instruct", + "display_name": "Qwen: Qwen3 VL 8B Instruct", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "cost": { + "input": 0.08, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen: Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -50833,21 +51459,20 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-07-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.11, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "qwen/qwen3.6-max-preview", + "name": "Qwen: Qwen3.6 Max Preview", + "display_name": "Qwen: Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -50857,8 +51482,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50878,52 +51503,51 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.43, - "output": 1.74, - "cache_read": 0.08 + "input": 1.04, + "output": 6.24, + "cache_write": 1.3 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama 4 Scout 17B", - "display_name": "Llama 4 Scout 17B", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 10000000, - "output": 16384 + "context": 160000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0.07, + "output": 0.27 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen: Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -50934,89 +51558,122 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 52429 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-09-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.02, - "output": 0.05 + "input": 0.09, + "output": 1.1 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama 3.1 70B", - "display_name": "Llama 3.1 70B", + "id": "qwen/qwen3.5-27b", + "name": "Qwen: Qwen3.5-27B", + "display_name": "Qwen: Qwen3.5-27B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.195, + "output": 1.56 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct-Turbo", - "name": "Llama 3.1 8B Turbo", - "display_name": "Llama 3.1 8B Turbo", + "id": "qwen/qwen3.6-flash", + "name": "Qwen: Qwen3.6 Flash", + "display_name": "Qwen: Qwen3.6 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.02, - "output": 0.03 + "input": 0.25, + "output": 1.5, + "cache_write": 0.3125 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", - "name": "Llama 3.3 70B Turbo", - "display_name": "Llama 3.3 70B Turbo", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "Qwen: Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -51024,30 +51681,30 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.32 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B FP8", - "display_name": "Llama 4 Maverick 17B FP8", + "id": "qwen/qwen-plus", + "name": "Qwen: Qwen-Plus", + "display_name": "Qwen: Qwen-Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -51055,26 +51712,39 @@ }, "limit": { "context": 1000000, - "output": 16384 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.4, + "output": 1.2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-70B-Instruct-Turbo", - "name": "Llama 3.1 70B Turbo", - "display_name": "Llama 3.1 70B Turbo", + "id": "qwen/qwen3-coder-plus", + "name": "Qwen: Qwen3 Coder Plus", + "display_name": "Qwen: Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -51084,27 +51754,29 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-07-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.65, + "output": 3.25, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "qwen/qwen-2.5-7b-instruct", + "name": "Qwen: Qwen2.5 7B Instruct", + "display_name": "Qwen: Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -51114,42 +51786,28 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 32768, + "output": 6554 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "release_date": "2024-09", + "last_updated": "2025-04-16", "cost": { - "input": 0.5, - "output": 2.15, - "cache_read": 0.35 + "input": 0.04, + "output": 0.1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "qwen/qwen3-14b", + "name": "Qwen: Qwen3 14B", + "display_name": "Qwen: Qwen3 14B", "modalities": { "input": [ "text" @@ -51159,8 +51817,8 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -51180,24 +51838,24 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.26, - "output": 0.38, - "cache_read": 0.13 + "input": 0.06, + "output": 0.24, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen/qwen3-vl-32b-instruct", + "name": "Qwen: Qwen3 VL 32B Instruct", + "display_name": "Qwen: Qwen3 VL 32B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -51205,33 +51863,27 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.03, - "output": 0.14 + "input": 0.104, + "output": 0.416 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "tencent/hy3-preview", + "name": "Tencent: Hy3 Preview", + "display_name": "Tencent: Hy3 Preview", "modalities": { "input": [ "text" @@ -51241,8 +51893,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -51250,25 +51902,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2026-04-22", + "last_updated": "2026-05-16", "cost": { - "input": 0.05, - "output": 0.24 + "input": 0.066, + "output": 0.26, + "cache_read": 0.029 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "tencent/hunyuan-a13b-instruct", + "name": "Tencent: Hunyuan A13B Instruct", + "display_name": "Tencent: Hunyuan A13B Instruct", "modalities": { "input": [ "text" @@ -51279,56 +51927,44 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-11-06", - "last_updated": "2025-11-07", + "open_weights": false, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.47, - "output": 2 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "google/gemini-3-pro-image-preview", + "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", + "display_name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 65536, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -51336,99 +51972,119 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2025-11-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.75, - "output": 3.5, - "cache_read": 0.15 + "input": 2, + "output": 12, + "reasoning": 12 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "google/gemma-4-26b-a4b-it", + "name": "Google: Gemma 4 26B A4B", + "display_name": "Google: Gemma 4 26B A4B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2026-04-03", + "last_updated": "2026-04-11", "cost": { - "input": 0.5, - "output": 2 + "input": 0.12, + "output": 0.4 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "google/gemini-3.1-flash-lite", + "name": "Google: Gemini 3.1 Flash Lite", + "display_name": "Google: Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-07", + "last_updated": "2026-05-16", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.15 + "input": 0.25, + "output": 1.5, + "reasoning": 1.5, + "cache_read": 0.025, + "cache_write": 0.08333 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "google/gemini-2.5-pro", + "name": "Google: Gemini 2.5 Pro", + "display_name": "Google: Gemini 2.5 Pro", "modalities": { "input": [ - "text", + "audio", "image", + "pdf", + "text", "video" ], "output": [ @@ -51436,8 +52092,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -51448,31 +52104,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "release_date": "2025-03-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.5, - "output": 2.8 + "input": 1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "google/gemma-3-27b-it", + "name": "Google: Gemma 3 27B", + "display_name": "Google: Gemma 3 27B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -51480,51 +52147,41 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-03-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.254, - "output": 1.02 + "input": 0.03, + "output": 0.11, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "google/gemma-4-31b-it", + "name": "Google: Gemma 4 31B", + "display_name": "Google: Gemma 4 31B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, + "context": 262144, "output": 131072 }, "temperature": true, @@ -51533,178 +52190,162 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-04-02", + "last_updated": "2026-04-11", "cost": { - "input": 0.27, - "output": 0.95, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.14, + "output": 0.4 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "google/gemini-3.1-flash-image-preview", + "name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", + "display_name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 65536, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 1.2 + "input": 0.5, + "output": 3 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "anthropic/claude-3-7-sonnet-latest", - "name": "Claude Sonnet 3.7 (Latest)", - "display_name": "Claude Sonnet 3.7 (Latest)", + "id": "google/gemini-2.5-pro-preview", + "name": "Google: Gemini 2.5 Pro Preview 06-05", + "display_name": "Google: Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ - "text", - "image" + "audio", + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2025-06-05", + "last_updated": "2026-03-15", "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33 + "input": 1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-4-opus", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "google/gemma-3n-e4b-it", + "name": "Google: Gemma 3n 4B", + "display_name": "Google: Gemma 3n 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 6554 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-06-12", - "last_updated": "2025-06-12", + "attachment": false, + "open_weights": true, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 16.5, - "output": 82.5 + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "google/gemini-2.5-pro-preview-05-06", + "name": "Google: Gemini 2.5 Pro Preview 05-06", + "display_name": "Google: Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -51715,192 +52356,248 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "google/gemini-2.5-flash-lite-preview-09-2025", + "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", + "display_name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 65536, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2026-03-15", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.1, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.01, + "cache_write": 0.083333 }, "type": "chat" }, { - "id": "google/gemma-4-26B-A4B-it", - "name": "Gemma 4 26B", - "display_name": "Gemma 4 26B", + "id": "google/gemini-2.5-flash-lite", + "name": "Google: Gemini 2.5 Flash Lite", + "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ + "audio", + "image", + "pdf", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.34 + "input": 0.1, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.01, + "cache_write": 0.083333 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "google/lyria-3-clip-preview", + "name": "Google: Lyria 3 Clip Preview", + "display_name": "Google: Lyria 3 Clip Preview", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-30", + "last_updated": "2026-04-11", "cost": { - "input": 0.13, - "output": 0.38 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "qiniu-ai": { - "id": "qiniu-ai", - "name": "Qiniu", - "display_name": "Qiniu", - "api": "https://api.qnaigc.com/v1", - "doc": "https://developer.qiniu.com/aitokenapi", - "models": [ + }, { - "id": "qwen3-235b-a22b", - "name": "Qwen 3 235B A22B", - "display_name": "Qwen 3 235B A22B", + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Google: Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Google: Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", + "cost": { + "input": 2, + "output": 12, + "reasoning": 12 + }, "type": "chat" }, { - "id": "doubao-seed-1.6-flash", - "name": "Doubao-Seed 1.6 Flash", - "display_name": "Doubao-Seed 1.6 Flash", + "id": "google/gemini-2.0-flash-lite-001", + "name": "Google: Gemini 2.0 Flash Lite", + "display_name": "Google: Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text", + "audio", "image", + "pdf", + "text", "video" ], "output": [ @@ -51908,56 +52605,71 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", + "release_date": "2024-12-11", + "last_updated": "2026-03-15", + "cost": { + "input": 0.075, + "output": 0.3 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235b A22B Instruct 2507", - "display_name": "Qwen3 235b A22B Instruct 2507", + "id": "google/gemini-2.0-flash-001", + "name": "Google: Gemini 2.0 Flash", + "display_name": "Google: Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "release_date": "2024-12-11", + "last_updated": "2026-03-15", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025, + "cache_write": 0.083333 + }, "type": "chat" }, { - "id": "doubao-seed-2.0-code", - "name": "Doubao Seed 2.0 Code", - "display_name": "Doubao Seed 2.0 Code", + "id": "google/gemini-3.1-flash-lite-preview", + "name": "Google: Gemini 3.1 Flash Lite Preview", + "display_name": "Google: Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text", + "audio", "image", + "pdf", + "text", "video" ], "output": [ @@ -51965,8 +52677,8 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -51974,54 +52686,95 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2026-03-03", + "last_updated": "2026-03-15", + "cost": { + "input": 0.25, + "output": 1.5, + "reasoning": 1.5 + }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "google/gemini-3.1-pro-preview", + "name": "Google: Gemini 3.1 Pro Preview", + "display_name": "Google: Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-19", + "last_updated": "2026-03-15", + "cost": { + "input": 2, + "output": 12, + "reasoning": 12 + }, "type": "chat" }, { - "id": "doubao-1.5-thinking-pro", - "name": "Doubao 1.5 Thinking Pro", - "display_name": "Doubao 1.5 Thinking Pro", + "id": "google/gemini-3-flash-preview", + "name": "Google: Gemini 3 Flash Preview", + "display_name": "Google: Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -52029,146 +52782,154 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-12-17", + "last_updated": "2026-03-15", + "cost": { + "input": 0.5, + "output": 3, + "reasoning": 3, + "cache_read": 0.05, + "cache_write": 0.083333 + }, "type": "chat" }, { - "id": "claude-3.7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "google/gemma-2-27b-it", + "name": "Google: Gemma 2 27B", + "display_name": "Google: Gemma 2 27B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-06-24", + "last_updated": "2024-06-24", + "cost": { + "input": 0.65, + "output": 0.65 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "google/lyria-3-pro-preview", + "name": "Google: Lyria 3 Pro Preview", + "display_name": "Google: Lyria 3 Pro Preview", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-22", - "last_updated": "2026-02-22", + "release_date": "2026-03-30", + "last_updated": "2026-04-11", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "qwen-vl-max-2025-01-25", - "name": "Qwen VL-MAX-2025-01-25", - "display_name": "Qwen VL-MAX-2025-01-25", + "id": "google/gemma-3-12b-it", + "name": "Google: Gemma 3 12B", + "display_name": "Google: Gemma 3 12B", "modalities": { "input": [ - "text", "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-03-13", + "last_updated": "2026-03-15", + "cost": { + "input": 0.04, + "output": 0.13, + "cache_read": 0.015 + }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "google/gemini-2.5-flash", + "name": "Google: Gemini 2.5 Flash", + "display_name": "Google: Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 4096 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -52179,277 +52940,261 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-07-17", + "last_updated": "2026-03-15", + "cost": { + "input": 0.3, + "output": 2.5, + "reasoning": 2.5, + "cache_read": 0.03, + "cache_write": 0.083333 + }, "type": "chat" }, { - "id": "doubao-1.5-pro-32k", - "name": "Doubao 1.5 Pro 32k", - "display_name": "Doubao 1.5 Pro 32k", + "id": "google/gemini-2.5-flash-image", + "name": "Google: Nano Banana (Gemini 2.5 Flash Image)", + "display_name": "Google: Nano Banana (Gemini 2.5 Flash Image)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 128000, - "output": 12000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" + "release_date": "2025-10-08", + "last_updated": "2026-03-15", + "cost": { + "input": 0.3, + "output": 2.5 + }, + "type": "imageGeneration" }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "Qwen 2.5 VL 72B Instruct", - "display_name": "Qwen 2.5 VL 72B Instruct", + "id": "google/gemma-3-4b-it", + "name": "Google: Gemma 3 4B", + "display_name": "Google: Gemma 3 4B", "modalities": { "input": [ - "text", "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 19200 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-03-13", + "last_updated": "2026-03-15", + "cost": { + "input": 0.04, + "output": 0.08 + }, "type": "chat" }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "microsoft/phi-4", + "name": "Microsoft: Phi 4", + "display_name": "Microsoft: Phi 4", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.06, + "output": 0.14 + }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b-thinking", - "name": "Qwen3-Vl 30b A3b Thinking", - "display_name": "Qwen3-Vl 30b A3b Thinking", + "id": "microsoft/wizardlm-2-8x22b", + "name": "WizardLM-2 8x22B", + "display_name": "WizardLM-2 8x22B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 65535, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-04-24", + "last_updated": "2024-04-24", + "cost": { + "input": 0.62, + "output": 0.62 }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-09", - "last_updated": "2026-02-09", "type": "chat" }, { - "id": "gemini-3.0-pro-image-preview", - "name": "Gemini 3.0 Pro Image Preview", - "display_name": "Gemini 3.0 Pro Image Preview", + "id": "microsoft/phi-4-mini-instruct", + "name": "Microsoft: Phi 4 Mini Instruct", + "display_name": "Microsoft: Phi 4 Mini Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2025-10-17", + "last_updated": "2026-05-07", + "cost": { + "input": 0.08, + "output": 0.35, + "cache_read": 0.08 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "gryphe/mythomax-l2-13b", + "name": "MythoMax 13B", + "display_name": "MythoMax 13B", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", + "cost": { + "input": 0.06, + "output": 0.06 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "claude-4.5-opus", - "name": "Claude 4.5 Opus", - "display_name": "Claude 4.5 Opus", + "id": "nex-agi/deepseek-v3.1-nex-n1", + "name": "Nex AGI: DeepSeek V3.1 Nex N1", + "display_name": "Nex AGI: DeepSeek V3.1 Nex N1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-25", + "release_date": "2025-01-01", "last_updated": "2025-11-25", + "cost": { + "input": 0.27, + "output": 1 + }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "upstage/solar-pro-3", + "name": "Upstage: Solar Pro 3", + "display_name": "Upstage: Solar Pro 3", "modalities": { "input": [ "text" @@ -52460,7 +53205,7 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -52468,39 +53213,62 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-01-27", + "last_updated": "2026-03-15", + "cost": { + "input": 0.15, + "output": 0.6 + }, "type": "chat" }, { - "id": "claude-4.0-opus", - "name": "Claude 4.0 Opus", - "display_name": "Claude 4.0 Opus", + "id": "anthracite-org/magnum-v4-72b", + "name": "Magnum v4 72B", + "display_name": "Magnum v4 72B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16384, + "output": 2048 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-10-22", + "last_updated": "2026-03-15", + "cost": { + "input": 3, + "output": 5 + }, + "type": "chat" + }, + { + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek: DeepSeek V3.2 Exp", + "display_name": "DeepSeek: DeepSeek V3.2 Exp", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -52508,45 +53276,52 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-09-29", + "cost": { + "input": 0.27, + "output": 0.41 + }, "type": "chat" }, { - "id": "claude-4.5-haiku", - "name": "Claude 4.5 Haiku", - "display_name": "Claude 4.5 Haiku", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek: DeepSeek V3", + "display_name": "DeepSeek: DeepSeek V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", + "cost": { + "input": 0.32, + "output": 0.89, + "cache_read": 0.15 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-16", - "last_updated": "2025-10-16", "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek: R1", + "display_name": "DeepSeek: R1", "modalities": { "input": [ "text" @@ -52556,13 +53331,14 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 64000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -52576,30 +53352,30 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 0.7, + "output": 2.5 + }, "type": "chat" }, { - "id": "gemini-3.0-flash-preview", - "name": "Gemini 3.0 Flash Preview", - "display_name": "Gemini 3.0 Flash Preview", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek: DeepSeek V4 Pro", + "display_name": "DeepSeek: DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -52610,60 +53386,73 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", + "cost": { + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 + }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "display_name": "Gemini 2.5 Flash Image", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek: R1 0528", + "display_name": "DeepSeek: R1 0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", - "type": "imageGeneration" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-05-28", + "last_updated": "2026-03-15", + "cost": { + "input": 0.45, + "output": 2.15, + "cache_read": 0.2 + }, + "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek: DeepSeek V3.2 Speciale", + "display_name": "DeepSeek: DeepSeek V3.2 Speciale", "modalities": { "input": [ "text" @@ -52673,37 +53462,41 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2026-03-15", + "cost": { + "input": 0.4, + "output": 1.2, + "cache_read": 0.135 + }, "type": "chat" }, { - "id": "claude-3.5-sonnet", - "name": "Claude 3.5 Sonnet", - "display_name": "Claude 3.5 Sonnet", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek: DeepSeek V3.2", + "display_name": "DeepSeek: DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8200 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -52711,45 +53504,58 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-09", - "last_updated": "2025-09-09", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2026-03-15", + "cost": { + "input": 0.26, + "output": 0.38, + "cache_read": 0.125 + }, "type": "chat" }, { - "id": "claude-4.0-sonnet", - "name": "Claude 4.0 Sonnet", - "display_name": "Claude 4.0 Sonnet", + "id": "deepseek/deepseek-v4-flash:free", + "name": "DeepSeek: DeepSeek V4 Flash (free)", + "display_name": "DeepSeek: DeepSeek V4 Flash (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 384000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-04-24", + "last_updated": "2026-05-16", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30b A3b Instruct 2507", - "display_name": "Qwen3 30b A3b Instruct 2507", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek: DeepSeek V4 Flash", + "display_name": "DeepSeek: DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -52759,37 +53565,52 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", + "cost": { + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 + }, "type": "chat" }, { - "id": "doubao-seed-1.6-thinking", - "name": "Doubao-Seed 1.6 Thinking", - "display_name": "Doubao-Seed 1.6 Thinking", + "id": "deepseek/deepseek-chat-v3-0324", + "name": "DeepSeek: DeepSeek V3 0324", + "display_name": "DeepSeek: DeepSeek V3 0324", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -52797,67 +53618,59 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-24", + "last_updated": "2026-03-15", + "cost": { + "input": 0.2, + "output": 0.77, + "cache_read": 0.095 + }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek: R1 Distill Llama 70B", + "display_name": "DeepSeek: R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-23", + "last_updated": "2026-03-15", + "cost": { + "input": 0.7, + "output": 0.8, + "cache_read": 0.015 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "deepseek/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek: R1 Distill Qwen 32B", + "display_name": "DeepSeek: R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -52867,36 +53680,29 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-11-25", + "cost": { + "input": 0.29, + "output": 0.29 + }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "deepseek/deepseek-chat-v3.1", + "name": "DeepSeek: DeepSeek V3.1", + "display_name": "DeepSeek: DeepSeek V3.1", "modalities": { "input": [ "text" @@ -52906,8 +53712,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 7168 }, "temperature": true, "tool_call": true, @@ -52915,27 +53721,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.15, + "output": 0.75 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30b A3b Thinking 2507", - "display_name": "Qwen3 30b A3b Thinking 2507", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek: DeepSeek V3.1 Terminus", + "display_name": "DeepSeek: DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -52945,8 +53744,8 @@ ] }, "limit": { - "context": 126000, - "output": 32000 + "context": 163840, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -52954,55 +53753,53 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "open_weights": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "cost": { + "input": 0.21, + "output": 0.79, + "cache_read": 0.13 + }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "perplexity/sonar", + "name": "Perplexity: Sonar", + "display_name": "Perplexity: Sonar", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4096 + "context": 127072, + "output": 25415 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 1, + "output": 1 + }, "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "perplexity/sonar-deep-research", + "name": "Perplexity: Sonar Deep Research", + "display_name": "Perplexity: Sonar Deep Research", "modalities": { "input": [ "text" @@ -53013,67 +53810,65 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 25600 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "cost": { + "input": 2, + "output": 8 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "perplexity/sonar-reasoning-pro", + "name": "Perplexity: Sonar Reasoning Pro", + "display_name": "Perplexity: Sonar Reasoning Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 4096 + "context": 128000, + "output": 25600 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 2, + "output": 8 + }, "type": "chat" }, { - "id": "claude-4.1-opus", - "name": "Claude 4.1 Opus", - "display_name": "Claude 4.1 Opus", + "id": "perplexity/sonar-pro-search", + "name": "Perplexity: Sonar Pro Search", + "display_name": "Perplexity: Sonar Pro Search", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" @@ -53081,54 +53876,60 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "release_date": "2025-10-31", + "last_updated": "2026-03-15", + "cost": { + "input": 3, + "output": 15 + }, "type": "chat" }, { - "id": "doubao-seed-2.0-mini", - "name": "Doubao Seed 2.0 Mini", - "display_name": "Doubao Seed 2.0 Mini", + "id": "perplexity/sonar-pro", + "name": "Perplexity: Sonar Pro", + "display_name": "Perplexity: Sonar Pro", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 3, + "output": 15 + }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "ai21/jamba-large-1.7", + "name": "AI21: Jamba Large 1.7", + "display_name": "AI21: Jamba Large 1.7", "modalities": { "input": [ "text" @@ -53138,8 +53939,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -53148,58 +53949,61 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "release_date": "2025-08-09", + "last_updated": "2026-03-15", + "cost": { + "input": 2, + "output": 8 + }, "type": "chat" }, { - "id": "doubao-seed-1.6", - "name": "Doubao-Seed 1.6", - "display_name": "Doubao-Seed 1.6", + "id": "meta-llama/llama-3.1-70b-instruct", + "name": "Meta: Llama 3.1 70B Instruct", + "display_name": "Meta: Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-23", + "cost": { + "input": 0.4, + "output": 0.4 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", "type": "chat" }, { - "id": "qwen2.5-vl-7b-instruct", - "name": "Qwen 2.5 VL 7B Instruct", - "display_name": "Qwen 2.5 VL 7B Instruct", + "id": "meta-llama/llama-4-scout", + "name": "Meta: Llama 4 Scout", + "display_name": "Meta: Llama 4 Scout", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 327680, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -53207,44 +54011,50 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.08, + "output": 0.3 + }, "type": "chat" }, { - "id": "kling-v2-6", - "name": "Kling-V2 6", - "display_name": "Kling-V2 6", + "id": "meta-llama/llama-3.2-1b-instruct", + "name": "Meta: Llama 3.2 1B Instruct", + "display_name": "Meta: Llama 3.2 1B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 99999999, - "output": 99999999 + "context": 60000, + "output": 12000 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-01-13", - "last_updated": "2026-01-13", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2026-01-27", + "cost": { + "input": 0.027, + "output": 0.2 + }, "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "meta-llama/llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "display_name": "Llama Guard 3 8B", "modalities": { "input": [ "text" @@ -53254,104 +54064,91 @@ ] }, "limit": { - "context": 1000000, - "output": 80000 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2024-04-18", + "last_updated": "2026-02-04", + "cost": { + "input": 0.02, + "output": 0.06 + }, "type": "chat" }, { - "id": "gemini-3.0-pro-preview", - "name": "Gemini 3.0 Pro Preview", - "display_name": "Gemini 3.0 Pro Preview", + "id": "meta-llama/llama-3-70b-instruct", + "name": "Meta: Llama 3 70B Instruct", + "display_name": "Meta: Llama 3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "pdf", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8192, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.51, + "output": 0.74 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", "type": "chat" }, { - "id": "doubao-seed-2.0-lite", - "name": "Doubao Seed 2.0 Lite", - "display_name": "Doubao Seed 2.0 Lite", + "id": "meta-llama/llama-3.2-11b-vision-instruct", + "name": "Meta: Llama 3.2 11B Vision Instruct", + "display_name": "Meta: Llama 3.2 11B Vision Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "open_weights": true, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.049, + "output": 0.049 + }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "meta-llama/llama-3-8b-instruct", + "name": "Meta: Llama 3 8B Instruct", + "display_name": "Meta: Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -53361,8 +54158,8 @@ ] }, "limit": { - "context": 262000, - "output": 4096 + "context": 8192, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -53370,15 +54167,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-14", - "last_updated": "2025-08-14", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2025-04-03", + "cost": { + "input": 0.03, + "output": 0.04 + }, "type": "chat" }, { - "id": "claude-3.5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "meta-llama/llama-4-maverick", + "name": "Meta: Llama 4 Maverick", + "display_name": "Meta: Llama 4 Maverick", "modalities": { "input": [ "text", @@ -53389,8 +54190,8 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1048576, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -53398,15 +54199,19 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-12-24", + "cost": { + "input": 0.15, + "output": 0.6 + }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Meta: Llama 3.3 70B Instruct", + "display_name": "Meta: Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -53416,30 +54221,28 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.32 + }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen-Turbo", - "display_name": "Qwen-Turbo", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Meta: Llama 3.2 3B Instruct", + "display_name": "Meta: Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -53449,38 +54252,31 @@ ] }, "limit": { - "context": 1000000, - "output": 4096 + "context": 80000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2026-03-15", + "cost": { + "input": 0.051, + "output": 0.34 + }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "meta-llama/llama-guard-4-12b", + "name": "Meta: Llama Guard 4 12B", + "display_name": "Meta: Llama Guard 4 12B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -53488,76 +54284,62 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 163840, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.18, + "output": 0.18 + }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Meta: Llama 3.1 8B Instruct", + "display_name": "Meta: Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.02, + "output": 0.05 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "arcee-ai/spotlight", + "name": "Arcee AI: Spotlight", + "display_name": "Arcee AI: Spotlight", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -53565,35 +54347,28 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 131072, + "output": 65537 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.18, + "output": 0.18 }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-06", - "last_updated": "2025-09-06", "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "arcee-ai/trinity-mini", + "name": "Arcee AI: Trinity Mini", + "display_name": "Arcee AI: Trinity Mini", "modalities": { "input": [ "text" @@ -53603,8 +54378,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -53612,79 +54387,82 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": true, + "release_date": "2025-12", + "last_updated": "2026-01-28", + "cost": { + "input": 0.045, + "output": 0.15 + }, "type": "chat" }, { - "id": "doubao-1.5-vision-pro", - "name": "Doubao 1.5 Vision Pro", - "display_name": "Doubao 1.5 Vision Pro", + "id": "arcee-ai/maestro-reasoning", + "name": "Arcee AI: Maestro Reasoning", + "display_name": "Arcee AI: Maestro Reasoning", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 131072, + "output": 32000 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.9, + "output": 3.3 + }, "type": "chat" }, { - "id": "claude-4.5-sonnet", - "name": "Claude 4.5 Sonnet", - "display_name": "Claude 4.5 Sonnet", + "id": "arcee-ai/coder-large", + "name": "Arcee AI: Coder Large", + "display_name": "Arcee AI: Coder Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.5, + "output": 0.8 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "arcee-ai/virtuoso-large", + "name": "Arcee AI: Virtuoso Large", + "display_name": "Arcee AI: Virtuoso Large", "modalities": { "input": [ "text" @@ -53694,24 +54472,28 @@ ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 131072, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.75, + "output": 1.2 + }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "arcee-ai/trinity-large-thinking", + "name": "Arcee AI: Trinity Large Thinking", + "display_name": "Arcee AI: Trinity Large Thinking", "modalities": { "input": [ "text" @@ -53721,8 +54503,8 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -53730,41 +54512,63 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-11", + "cost": { + "input": 0.22, + "output": 0.85 + }, + "type": "chat" + }, + { + "id": "arcee-ai/trinity-large-preview", + "name": "Arcee AI: Trinity Large Preview", + "display_name": "Arcee AI: Trinity Large Preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-01-28", + "last_updated": "2026-05-01", + "cost": { + "input": 0.15, + "output": 0.45 + }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "kilo-auto/frontier", + "name": "Kilo Auto Frontier", + "display_name": "Kilo Auto Frontier", "modalities": { "input": [ - "text", "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -53774,14 +54578,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", + "cost": { + "input": 5, + "output": 25 + }, "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen2.5-Max-2025-01-25", - "display_name": "Qwen2.5-Max-2025-01-25", + "id": "kilo-auto/balanced", + "name": "Kilo Auto Balanced", + "display_name": "Kilo Auto Balanced", "modalities": { "input": [ "text" @@ -53791,36 +54599,40 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", + "cost": { + "input": 0.6, + "output": 3 + }, "type": "chat" }, { - "id": "doubao-seed-2.0-pro", - "name": "Doubao Seed 2.0 Pro", - "display_name": "Doubao Seed 2.0 Pro", + "id": "kilo-auto/small", + "name": "Kilo Auto Small", + "display_name": "Kilo Auto Small", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 400000, "output": 128000 }, "temperature": true, @@ -53831,14 +54643,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", + "cost": { + "input": 0.05, + "output": 0.4 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp-thinking", - "name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", - "display_name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", + "id": "kilo-auto/free", + "name": "Kilo Auto Free", + "display_name": "Kilo Auto Free", "modalities": { "input": [ "text" @@ -53848,25 +54664,29 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus-thinking", - "name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", - "display_name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", + "id": "essentialai/rnj-1-instruct", + "name": "EssentialAI: Rnj 1 Instruct", + "display_name": "EssentialAI: Rnj 1 Instruct", "modalities": { "input": [ "text" @@ -53876,25 +54696,60 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 32768, + "output": 6554 }, "temperature": true, - "tool_call": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-05", + "last_updated": "2026-03-15", + "cost": { + "input": 0.15, + "output": 0.15 + }, + "type": "chat" + }, + { + "id": "alibaba/tongyi-deepresearch-30b-a3b", + "name": "Tongyi DeepResearch 30B A3B", + "display_name": "Tongyi DeepResearch 30B A3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "release_date": "2025-09-18", + "last_updated": "2026-03-15", + "cost": { + "input": 0.09, + "output": 0.45 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek/DeepSeek-V3.2-Exp", - "display_name": "DeepSeek/DeepSeek-V3.2-Exp", + "id": "stepfun/step-3.5-flash", + "name": "StepFun: Step 3.5 Flash", + "display_name": "StepFun: Step 3.5 Flash", "modalities": { "input": [ "text" @@ -53904,24 +54759,30 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-251201", - "name": "Deepseek/DeepSeek-V3.2", - "display_name": "Deepseek/DeepSeek-V3.2", + "id": "stepfun/step-3.5-flash:free", + "name": "StepFun: Step 3.5 Flash (free)", + "display_name": "StepFun: Step 3.5 Flash (free)", "modalities": { "input": [ "text" @@ -53931,8 +54792,8 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -53942,25 +54803,31 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-08-26", + "last_updated": "2026-05-01", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "deepseek/deepseek-math-v2", - "name": "Deepseek/Deepseek-Math-V2", - "display_name": "Deepseek/Deepseek-Math-V2", + "id": "perceptron/perceptron-mk1", + "name": "Perceptron: Perceptron Mk1", + "display_name": "Perceptron: Perceptron Mk1", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": false, @@ -53968,21 +54835,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2026-05-12", + "last_updated": "2026-05-16", + "cost": { + "input": 0.15, + "output": 1.5 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek/DeepSeek-V3.1-Terminus", - "display_name": "DeepSeek/DeepSeek-V3.1-Terminus", + "id": "allenai/olmo-3-32b-think", + "name": "AllenAI: Olmo 3 32B Think", + "display_name": "AllenAI: Olmo 3 32B Think", "modalities": { "input": [ "text" @@ -53992,113 +54858,130 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 65536, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": true, + "release_date": "2025-11-22", + "last_updated": "2026-03-15", + "cost": { + "input": 0.15, + "output": 0.5 + }, "type": "chat" }, { - "id": "stepfun-ai/gelab-zero-4b-preview", - "name": "Stepfun-Ai/Gelab Zero 4b Preview", - "display_name": "Stepfun-Ai/Gelab Zero 4b Preview", + "id": "rekaai/reka-flash-3", + "name": "Reka Flash 3", + "display_name": "Reka Flash 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 65536, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2026-04-11", + "cost": { + "input": 0.1, + "output": 0.2 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", "type": "chat" }, { - "id": "stepfun/step-3.5-flash", - "name": "Stepfun/Step-3.5 Flash", - "display_name": "Stepfun/Step-3.5 Flash", + "id": "rekaai/reka-edge", + "name": "Reka Edge", + "display_name": "Reka Edge", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 4096 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "open_weights": true, + "release_date": "2026-03-20", + "last_updated": "2026-04-11", + "cost": { + "input": 0.1, + "output": 0.1 + }, "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "x-AI/Grok-4-Fast", - "display_name": "x-AI/Grok-4-Fast", + "id": "baidu/qianfan-ocr-fast", + "name": "Baidu: Qianfan-OCR-Fast", + "display_name": "Baidu: Qianfan-OCR-Fast", "modalities": { "input": [ - "text", "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 65536, + "output": 28672 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-09-20", - "last_updated": "2025-09-20", + "release_date": "2026-04-20", + "last_updated": "2026-05-16", + "cost": { + "input": 0.68, + "output": 2.81 + }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "x-AI/Grok-Code-Fast 1", - "display_name": "x-AI/Grok-Code-Fast 1", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "Baidu: ERNIE 4.5 VL 424B A47B ", + "display_name": "Baidu: ERNIE 4.5 VL 424B A47B ", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -54106,97 +54989,91 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 123000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": true, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2026-01", + "cost": { + "input": 0.42, + "output": 1.25 }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-02", - "last_updated": "2025-09-02", "type": "chat" }, { - "id": "x-ai/grok-4-fast-reasoning", - "name": "X-Ai/Grok-4-Fast-Reasoning", - "display_name": "X-Ai/Grok-4-Fast-Reasoning", + "id": "baidu/ernie-4.5-21b-a3b", + "name": "Baidu: ERNIE 4.5 21B A3B", + "display_name": "Baidu: ERNIE 4.5 21B A3B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 120000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "cost": { + "input": 0.07, + "output": 0.28 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-non-reasoning", - "name": "X-Ai/Grok 4.1 Fast Non Reasoning", - "display_name": "X-Ai/Grok 4.1 Fast Non Reasoning", + "id": "baidu/ernie-4.5-300b-a47b", + "name": "Baidu: ERNIE 4.5 300B A47B ", + "display_name": "Baidu: ERNIE 4.5 300B A47B ", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 123000, + "output": 12000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2026-01", + "cost": { + "input": 0.28, + "output": 1.1 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "x-AI/Grok-4.1-Fast", - "display_name": "x-AI/Grok-4.1-Fast", + "id": "baidu/ernie-4.5-21b-a3b-thinking", + "name": "Baidu: ERNIE 4.5 21B A3B Thinking", + "display_name": "Baidu: ERNIE 4.5 21B A3B Thinking", "modalities": { "input": [ "text" @@ -54206,70 +55083,73 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "open_weights": true, + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "cost": { + "input": 0.07, + "output": 0.28 + }, "type": "chat" }, { - "id": "x-ai/grok-4-fast-non-reasoning", - "name": "X-Ai/Grok-4-Fast-Non-Reasoning", - "display_name": "X-Ai/Grok-4-Fast-Non-Reasoning", + "id": "baidu/cobuddy:free", + "name": "Baidu: CoBuddy (free)", + "display_name": "Baidu: CoBuddy (free)", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 131072, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "release_date": "2026-05-06", + "last_updated": "2026-05-07", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-reasoning", - "name": "X-Ai/Grok 4.1 Fast Reasoning", - "display_name": "X-Ai/Grok 4.1 Fast Reasoning", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "Baidu: ERNIE 4.5 VL 28B A3B", + "display_name": "Baidu: ERNIE 4.5 VL 28B A3B", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 20000000, - "output": 2000000 + "context": 30000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -54278,66 +55158,51 @@ "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "cost": { + "input": 0.14, + "output": 0.56 + }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "OpenAI/GPT-5.2", - "display_name": "OpenAI/GPT-5.2", + "id": "poolside/laguna-xs.2:free", + "name": "Poolside: Laguna XS.2 (free)", + "display_name": "Poolside: Laguna XS.2 (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-04-28", + "last_updated": "2026-05-01", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "OpenAI/GPT-5", - "display_name": "OpenAI/GPT-5", + "id": "poolside/laguna-m.1:free", + "name": "Poolside: Laguna M.1 (free)", + "display_name": "Poolside: Laguna M.1 (free)", "modalities": { "input": [ "text" @@ -54347,8 +55212,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -54356,48 +55221,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2026-04-28", + "last_updated": "2026-05-01", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "Z-Ai/GLM 4.7", - "display_name": "Z-Ai/GLM 4.7", + "id": "xiaomi/mimo-v2-omni", + "name": "Xiaomi: MiMo-V2-Omni", + "display_name": "Xiaomi: MiMo-V2-Omni", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -54405,27 +55257,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.4, + "output": 2, + "cache_read": 0.08 + }, "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "Z-Ai/GLM 5", - "display_name": "Z-Ai/GLM 5", + "id": "xiaomi/mimo-v2.5-pro", + "name": "Xiaomi: MiMo V2.5 Pro", + "display_name": "Xiaomi: MiMo V2.5 Pro", "modalities": { "input": [ "text" @@ -54435,8 +55282,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -54456,43 +55303,71 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] + }, "type": "chat" }, { - "id": "z-ai/autoglm-phone-9b", - "name": "Z-Ai/Autoglm Phone 9b", - "display_name": "Z-Ai/Autoglm Phone 9b", + "id": "xiaomi/mimo-v2-flash", + "name": "Xiaomi: MiMo-V2-Flash", + "display_name": "Xiaomi: MiMo-V2-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 12800, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", + "cost": { + "input": 0.09, + "output": 0.29, + "cache_read": 0.045 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "Z-AI/GLM 4.6", - "display_name": "Z-AI/GLM 4.6", + "id": "xiaomi/mimo-v2-pro", + "name": "Xiaomi: MiMo-V2-Pro", + "display_name": "Xiaomi: MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -54502,40 +55377,61 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-10-11", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] + }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "Minimax/Minimax-M2", - "display_name": "Minimax/Minimax-M2", + "id": "xiaomi/mimo-v2.5", + "name": "Xiaomi: MiMo-V2.5", + "display_name": "Xiaomi: MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -54545,19 +55441,56 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + }, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ] + }, "type": "chat" - }, + } + ] + }, + "lmstudio": { + "id": "lmstudio", + "name": "LMStudio", + "display_name": "LMStudio", + "api": "http://127.0.0.1:1234/v1", + "doc": "https://lmstudio.ai/models", + "models": [ { - "id": "minimax/minimax-m2.1", - "name": "Minimax/Minimax-M2.1", - "display_name": "Minimax/Minimax-M2.1", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -54567,8 +55500,8 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -54582,15 +55515,19 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "Minimax/Minimax-M2.5", - "display_name": "Minimax/Minimax-M2.5", + "id": "qwen/qwen3-coder-30b", + "name": "Qwen3 Coder 30B", + "display_name": "Qwen3 Coder 30B", "modalities": { "input": [ "text" @@ -54600,30 +55537,29 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "Minimax/Minimax-M2.5 Highspeed", - "display_name": "Minimax/Minimax-M2.5 Highspeed", + "id": "qwen/qwen3-30b-a3b-2507", + "name": "Qwen3 30B A3B 2507", + "display_name": "Qwen3 30B A3B 2507", "modalities": { "input": [ "text" @@ -54633,48 +55569,89 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + } + ] + }, + "xiaomi-token-plan-cn": { + "id": "xiaomi-token-plan-cn", + "name": "Xiaomi Token Plan (China)", + "display_name": "Xiaomi Token Plan (China)", + "api": "https://token-plan-cn.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ + { + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 8192, + "output": 16384 + }, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Moonshotai/Kimi-K2.5", - "display_name": "Moonshotai/Kimi-K2.5", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -54689,14 +55666,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -54706,24 +55689,42 @@ ] }, "limit": { - "context": 256000, - "output": 100000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -54733,13 +55734,14 @@ ] }, "limit": { - "context": 256000, - "output": 100000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -54753,15 +55755,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "meituan/longcat-flash-chat", - "name": "Meituan/Longcat-Flash-Chat", - "display_name": "Meituan/Longcat-Flash-Chat", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -54771,62 +55779,110 @@ ] }, "limit": { - "context": 131072, + "context": 1048576, "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-11-05", - "last_updated": "2025-11-05", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "meituan/longcat-flash-lite", - "name": "Meituan/Longcat-Flash-Lite", - "display_name": "Meituan/Longcat-Flash-Lite", - "modalities": { - "input": [ - "text" + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 320000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 }, - "attachment": false, - "open_weights": false, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", "type": "chat" - }, + } + ] + }, + "v0": { + "id": "v0", + "name": "v0", + "display_name": "v0", + "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", + "models": [ { - "id": "mimo-v2-flash", - "name": "Mimo-V2-Flash", - "display_name": "Mimo-V2-Flash", + "id": "v0-1.5-md", + "name": "v0-1.5-md", + "display_name": "v0-1.5-md", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -54834,33 +55890,32 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "Xiaomi/Mimo-V2-Flash", - "display_name": "Xiaomi/Mimo-V2-Flash", + "id": "v0-1.5-lg", + "name": "v0-1.5-lg", + "display_name": "v0-1.5-lg", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 512000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -54868,64 +55923,62 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 15, + "output": 75 }, "type": "chat" - } - ] - }, - "kilo": { - "id": "kilo", - "name": "Kilo Gateway", - "display_name": "Kilo Gateway", - "api": "https://api.kilo.ai/api/gateway", - "doc": "https://kilo.ai", - "models": [ + }, { - "id": "rekaai/reka-edge", - "name": "Reka Edge", - "display_name": "Reka Edge", + "id": "v0-1.0-md", + "name": "v0-1.0-md", + "display_name": "v0-1.0-md", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-20", - "last_updated": "2026-04-11", + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.1, - "output": 0.1 + "input": 3, + "output": 15 }, "type": "chat" - }, + } + ] + }, + "morph": { + "id": "morph", + "name": "Morph", + "display_name": "Morph", + "api": "https://api.morphllm.com/v1", + "doc": "https://docs.morphllm.com/api-reference/introduction", + "models": [ { - "id": "rekaai/reka-flash-3", - "name": "Reka Flash 3", - "display_name": "Reka Flash 3", + "id": "morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ "text" @@ -54935,29 +55988,28 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 32000, + "output": 32000 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2026-04-11", + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.1, - "output": 0.2 + "input": 0.9, + "output": 1.9 }, "type": "chat" }, { - "id": "ai21/jamba-large-1.7", - "name": "AI21: Jamba Large 1.7", - "display_name": "AI21: Jamba Large 1.7", + "id": "auto", + "name": "Auto", + "display_name": "Auto", "modalities": { "input": [ "text" @@ -54967,28 +56019,28 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-09", - "last_updated": "2026-03-15", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 2, - "output": 8 + "input": 0.85, + "output": 1.55 }, "type": "chat" }, { - "id": "alibaba/tongyi-deepresearch-30b-a3b", - "name": "Tongyi DeepResearch 30B A3B", - "display_name": "Tongyi DeepResearch 30B A3B", + "id": "morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", "modalities": { "input": [ "text" @@ -54998,60 +56050,68 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 16000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2026-03-15", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.09, - "output": 0.45 + "input": 0.8, + "output": 1.2 }, "type": "chat" - }, + } + ] + }, + "nearai": { + "id": "nearai", + "name": "NEAR AI Cloud", + "display_name": "NEAR AI Cloud", + "api": "https://cloud-api.near.ai/v1", + "doc": "https://docs.near.ai/", + "models": [ { - "id": "inflection/inflection-3-pi", - "name": "Inflection: Inflection 3 Pi", - "display_name": "Inflection: Inflection 3 Pi", + "id": "openai/whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 448, + "output": 448 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 2.5, - "output": 10 + "input": 0.01, + "output": 0 }, "type": "chat" }, { - "id": "inflection/inflection-3-productivity", - "name": "Inflection: Inflection 3 Productivity", - "display_name": "Inflection: Inflection 3 Productivity", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text" @@ -55061,28 +56121,34 @@ ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 131000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2.5, - "output": 10 + "input": 0.15, + "output": 0.55 }, "type": "chat" }, { - "id": "liquid/lfm-2-24b-a2b", - "name": "LiquidAI: LFM2-24B-A2B", - "display_name": "LiquidAI: LFM2-24B-A2B", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1 FP8", + "display_name": "GLM-5.1 FP8", "modalities": { "input": [ "text" @@ -55092,39 +56158,52 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 202752, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.03, - "output": 0.12 + "input": 0.85, + "output": 3.3 }, "type": "chat" }, { - "id": "writer/palmyra-x5", - "name": "Writer: Palmyra X5", - "display_name": "Writer: Palmyra X5", + "id": "black-forest-labs/FLUX.2-klein-4B", + "name": "FLUX.2 Klein 4B", + "display_name": "FLUX.2 Klein 4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1040000, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": false, @@ -55132,19 +56211,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": true, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.6, - "output": 6 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "ibm-granite/granite-4.1-8b", - "name": "IBM: Granite 4.1 8B", - "display_name": "IBM: Granite 4.1 8B", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B-A3B Instruct 2507", + "display_name": "Qwen3 30B-A3B Instruct 2507", "modalities": { "input": [ "text" @@ -55154,8 +56233,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -55163,20 +56242,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-05-01", + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.05, - "output": 0.1, - "cache_read": 0.05 + "input": 0.15, + "output": 0.55 }, "type": "chat" }, { - "id": "ibm-granite/granite-4.0-h-micro", - "name": "IBM: Granite 4.0 Micro", - "display_name": "IBM: Granite 4.0 Micro", + "id": "Qwen/Qwen3-Embedding-0.6B", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ "text" @@ -55186,28 +56264,28 @@ ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 40960, + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2026-03-15", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { - "input": 0.017, - "output": 0.11 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "essentialai/rnj-1-instruct", - "name": "EssentialAI: Rnj 1 Instruct", - "display_name": "EssentialAI: Rnj 1 Instruct", + "id": "Qwen/Qwen3-Reranker-0.6B", + "name": "Qwen3 Reranker 0.6B", + "display_name": "Qwen3 Reranker 0.6B", "modalities": { "input": [ "text" @@ -55217,28 +56295,28 @@ ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 40960, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-05", - "last_updated": "2026-03-15", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.01, + "output": 0.01 }, - "type": "chat" + "type": "rerank" }, { - "id": "perplexity/sonar-pro", - "name": "Perplexity: Sonar Pro", - "display_name": "Perplexity: Sonar Pro", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen3-VL 30B-A3B Instruct", + "display_name": "Qwen3-VL 30B-A3B Instruct", "modalities": { "input": [ "text", @@ -55249,60 +56327,85 @@ ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 256000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 3, - "output": 15 + "input": 0.15, + "output": 0.55 }, "type": "chat" }, { - "id": "perplexity/sonar-deep-research", - "name": "Perplexity: Sonar Deep Research", - "display_name": "Perplexity: Sonar Deep Research", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 25600 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 2, - "output": 8 + "input": 1.8, + "output": 15.5, + "cache_read": 0.18 }, "type": "chat" }, { - "id": "perplexity/sonar", - "name": "Perplexity: Sonar", - "display_name": "Perplexity: Sonar", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", @@ -55313,354 +56416,536 @@ ] }, "limit": { - "context": 127072, - "output": 25415 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 1, - "output": 1 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "perplexity/sonar-pro-search", - "name": "Perplexity: Sonar Pro Search", - "display_name": "Perplexity: Sonar Pro Search", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-10-31", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 3, - "output": 15 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Perplexity: Sonar Reasoning Pro", - "display_name": "Perplexity: Sonar Reasoning Pro", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 25600 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2, - "output": 8 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3.1", - "name": "DeepSeek: DeepSeek V3.1", - "display_name": "DeepSeek: DeepSeek V3.1", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 7168 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.15, - "output": 0.75 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek: DeepSeek V3", - "display_name": "DeepSeek: DeepSeek V3", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.32, - "output": 0.89, - "cache_read": 0.15 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek: R1 Distill Llama 70B", - "display_name": "DeepSeek: R1 Distill Llama 70B", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-23", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.7, - "output": 0.8, - "cache_read": 0.015 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek: R1", - "display_name": "DeepSeek: R1", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.7, - "output": 2.5 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-speciale", - "name": "DeepSeek: DeepSeek V3.2 Speciale", - "display_name": "DeepSeek: DeepSeek V3.2 Speciale", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.4, - "output": 1.2, - "cache_read": 0.135 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-32b", - "name": "DeepSeek: R1 Distill Qwen 32B", - "display_name": "DeepSeek: R1 Distill Qwen 32B", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 1047576, "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.29, - "output": 0.29 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek: DeepSeek V3.2 Exp", - "display_name": "DeepSeek: DeepSeek V3.2 Exp", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-09-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.27, - "output": 0.41 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek: DeepSeek V4 Flash", - "display_name": "DeepSeek: DeepSeek V4 Flash", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -55669,29 +56954,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek: DeepSeek V4 Pro", - "display_name": "DeepSeek: DeepSeek V4 Pro", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -55701,10 +56997,10 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -55713,42 +57009,48 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek: DeepSeek V3.2", - "display_name": "DeepSeek: DeepSeek V3.2", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -55756,68 +57058,103 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.26, - "output": 0.38, - "cache_read": 0.125 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3-0324", - "name": "DeepSeek: DeepSeek V3 0324", - "display_name": "DeepSeek: DeepSeek V3 0324", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.2, - "output": 0.77, - "cache_read": 0.095 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek: R1 0528", - "display_name": "DeepSeek: R1 0528", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -55827,41 +57164,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-28", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.45, - "output": 2.15, - "cache_read": 0.2 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek: DeepSeek V3.1 Terminus", - "display_name": "DeepSeek: DeepSeek V3.1 Terminus", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -55869,163 +57204,274 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.21, - "output": 0.79, - "cache_read": 0.13 + "input": 3, + "output": 15.5, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openrouter/auto", - "name": "Auto Router", - "display_name": "Auto Router", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ - "image", "text" ] }, "limit": { - "context": 2000000, - "output": 32768 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openrouter/bodybuilder", - "name": "Body Builder (beta)", - "display_name": "Body Builder (beta)", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openrouter/owl-alpha", - "name": "Owl Alpha", - "display_name": "Owl Alpha", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 262144 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-04-30", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openrouter/pareto-code", - "name": "Pareto Code Router", - "display_name": "Pareto Code Router", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1048576, "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "openrouter/free", - "name": "Free Models Router", - "display_name": "Free Models Router", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ + "text", "image", - "text" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -56033,83 +57479,174 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-02-01", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "inclusionai/ling-2.6-1t:free", - "name": "inclusionAI: Ling-2.6-1T (free)", - "display_name": "inclusionAI: Ling-2.6-1T (free)", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "inclusionai/ling-2.6-flash", - "name": "inclusionAI: Ling-2.6 Flash", - "display_name": "inclusionAI: Ling-2.6 Flash", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.016 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Arcee AI: Trinity Mini", - "display_name": "Arcee AI: Trinity Mini", + "id": "Qwen/Qwen3.5-122B-A10B", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text" @@ -56120,7 +57657,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -56128,54 +57665,79 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-12", - "last_updated": "2026-01-28", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.045, - "output": 0.15 + "input": 0.4, + "output": 3.2 }, "type": "chat" - }, + } + ] + }, + "abacus": { + "id": "abacus", + "name": "Abacus", + "display_name": "Abacus", + "api": "https://routellm.abacus.ai/v1", + "doc": "https://abacus.ai/help/api", + "models": [ { - "id": "arcee-ai/virtuoso-large", - "name": "Arcee AI: Virtuoso Large", - "display_name": "Arcee AI: Virtuoso Large", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 64000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.75, - "output": 1.2 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-thinking", - "name": "Arcee AI: Trinity Large Thinking", - "display_name": "Arcee AI: Trinity Large Thinking", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -56183,7 +57745,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -56191,287 +57753,395 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-11", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.22, - "output": 0.85 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "arcee-ai/spotlight", - "name": "Arcee AI: Spotlight", - "display_name": "Arcee AI: Spotlight", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65537 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.18, - "output": 0.18 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "arcee-ai/maestro-reasoning", - "name": "Arcee AI: Maestro Reasoning", - "display_name": "Arcee AI: Maestro Reasoning", + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 0.9, - "output": 3.3 + "input": 20, + "output": 40 }, "type": "chat" }, { - "id": "arcee-ai/coder-large", - "name": "Arcee AI: Coder Large", - "display_name": "Arcee AI: Coder Large", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.5, - "output": 0.8 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-preview", - "name": "Arcee AI: Trinity Large Preview", - "display_name": "Arcee AI: Trinity Large Preview", + "id": "route-llm", + "name": "Route LLM", + "display_name": "Route LLM", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-05-01", + "knowledge": "2024-10", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.15, - "output": 0.45 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "deepcogito/cogito-v2.1-671b", - "name": "Deep Cogito: Cogito v2.1 671B", - "display_name": "Deep Cogito: Cogito v2.1 671B", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-14", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { "input": 1.25, - "output": 1.25 + "output": 10 }, "type": "chat" }, { - "id": "upstage/solar-pro-3", - "name": "Upstage: Solar Pro 3", - "display_name": "Upstage: Solar Pro 3", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 2000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-03-15", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "nex-agi/deepseek-v3.1-nex-n1", - "name": "Nex AGI: DeepSeek V3.1 Nex N1", - "display_name": "Nex AGI: DeepSeek V3.1 Nex N1", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 163840 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.27, - "output": 1 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "bytedance-seed/seed-1.6", - "name": "ByteDance Seed: Seed 1.6", - "display_name": "ByteDance Seed: Seed 1.6", + "id": "gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-09", - "last_updated": "2025-09", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.25, - "output": 2 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "bytedance-seed/seed-2.0-lite", - "name": "ByteDance Seed: Seed-2.0-Lite", - "display_name": "ByteDance Seed: Seed-2.0-Lite", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -56479,33 +58149,43 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-10", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.25, - "output": 2 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "bytedance-seed/seed-1.6-flash", - "name": "ByteDance Seed: Seed 1.6 Flash", - "display_name": "ByteDance Seed: Seed 1.6 Flash", + "id": "grok-4-0709", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -56514,84 +58194,86 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.075, - "output": 0.3 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "bytedance-seed/seed-2.0-mini", - "name": "ByteDance Seed: Seed-2.0-Mini", - "display_name": "ByteDance Seed: Seed-2.0-Mini", + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat Latest", + "display_name": "GPT-5.1 Chat Latest", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-27", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "mancer/weaver", - "name": "Mancer: Weaver (alpha)", - "display_name": "Mancer: Weaver (alpha)", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-08-02", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.75, - "output": 1 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "anthracite-org/magnum-v4-72b", - "name": "Magnum v4 72B", - "display_name": "Magnum v4 72B", + "id": "llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "display_name": "Llama 3.3 70B Versatile", "modalities": { "input": [ "text" @@ -56601,97 +58283,126 @@ ] }, "limit": { - "context": 16384, - "output": 2048 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-10-22", - "last_updated": "2026-03-15", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 3, - "output": 5 + "input": 0.59, + "output": 0.79 }, "type": "chat" }, { - "id": "kilo-auto/balanced", - "name": "Kilo Auto Balanced", - "display_name": "Kilo Auto Balanced", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.6, - "output": 3 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "kilo-auto/frontier", - "name": "Kilo Auto Frontier", - "display_name": "Kilo Auto Frontier", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 5, - "output": 25 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "kilo-auto/small", - "name": "Kilo Auto Small", - "display_name": "Kilo Auto Small", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" @@ -56701,248 +58412,352 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.05, - "output": 0.4 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "kilo-auto/free", - "name": "Kilo Auto Free", - "display_name": "Kilo Auto Free", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "undi95/remm-slerp-l2-13b", - "name": "ReMM SLERP 13B", - "display_name": "ReMM SLERP 13B", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 6144, - "output": 4096 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2023-07-22", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.45, - "output": 0.65 + "input": 2.5, + "output": 15 }, "type": "chat" }, { - "id": "allenai/olmo-3-32b-think", - "name": "AllenAI: Olmo 3 32B Think", - "display_name": "AllenAI: Olmo 3 32B Think", + "id": "gpt-4o-mini", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-22", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { "input": 0.15, - "output": 0.5 + "output": 0.6 }, "type": "chat" }, { - "id": "nousresearch/hermes-2-pro-llama-3-8b", - "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", - "display_name": "NousResearch: Hermes 2 Pro - Llama-3 8B", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-05-27", - "last_updated": "2024-06-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.14, - "output": 0.14 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "nousresearch/hermes-4-405b", - "name": "Nous: Hermes 4 405B", - "display_name": "Nous: Hermes 4 405B", + "id": "gpt-5.3-codex-xhigh", + "name": "GPT-5.3 Codex XHigh", + "display_name": "GPT-5.3 Codex XHigh", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1, - "output": 3 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-70b", - "name": "Nous: Hermes 3 70B Instruct", - "display_name": "Nous: Hermes 3 70B Instruct", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-18", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 0.3, - "output": 0.3 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "nousresearch/hermes-4-70b", - "name": "Nous: Hermes 4 70B", - "display_name": "Nous: Hermes 4 70B", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.13, - "output": 0.4, - "cache_read": 0.055 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-405b", - "name": "Nous: Hermes 3 405B Instruct", - "display_name": "Nous: Hermes 3 405B Instruct", + "id": "qwen-2.5-coder-32b", + "name": "Qwen 2.5 Coder 32B", + "display_name": "Qwen 2.5 Coder 32B", "modalities": { "input": [ "text" @@ -56952,133 +58767,195 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-08-16", - "last_updated": "2024-08-16", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "cost": { - "input": 1, - "output": 1 + "input": 0.79, + "output": 0.79 }, "type": "chat" }, { - "id": "morph/morph-v3-fast", - "name": "Morph: Morph V3 Fast", - "display_name": "Morph: Morph V3 Fast", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 81920, - "output": 38000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "cache_write": 1 }, "type": "chat" }, { - "id": "morph/morph-v3-large", - "name": "Morph: Morph V3 Large", - "display_name": "Morph: Morph V3 Large", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.9, - "output": 1.9 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "stepfun/step-3.5-flash:free", - "name": "StepFun: Step 3.5 Flash (free)", - "display_name": "StepFun: Step 3.5 Flash (free)", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2026-05-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "stepfun/step-3.5-flash", - "name": "StepFun: Step 3.5 Flash", - "display_name": "StepFun: Step 3.5 Flash", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -57086,114 +58963,155 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "alpindale/goliath-120b", - "name": "Goliath 120B", - "display_name": "Goliath 120B", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat Latest", + "display_name": "GPT-5.2 Chat Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 6144, - "output": 1024 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-10", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 3.75, - "output": 7.5 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral: Mistral Nemo", - "display_name": "Mistral: Mistral Nemo", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 Nano", + "display_name": "GPT-4.1 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-01", - "last_updated": "2024-07-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.02, - "output": 0.04 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "mistralai/mistral-saba", - "name": "Mistral: Saba", - "display_name": "Mistral: Saba", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-02-17", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.2, - "output": 0.6 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2512", - "name": "Mistral: Mistral Large 3 2512", - "display_name": "Mistral: Mistral Large 3 2512", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", @@ -57204,104 +59122,156 @@ ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2024-11-01", - "last_updated": "2025-12-16", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.5, - "output": 1.5 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "mistralai/devstral-medium", - "name": "Mistral: Devstral Medium", - "display_name": "Mistral: Devstral Medium", + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.4, - "output": 2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "mistralai/mistral-small-3.1-24b-instruct", - "name": "Mistral: Mistral Small 3.1 24B", - "display_name": "Mistral: Mistral Small 3.1 24B", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-17", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.35, - "output": 0.56, - "cache_read": 0.015 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3-5", - "name": "Mistral: Mistral Medium 3.5", - "display_name": "Mistral: Mistral Medium 3.5", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ + "text", "image", - "text" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -57309,52 +59279,96 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-05-07", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "mistralai/pixtral-large-2411", - "name": "Mistral: Pixtral Large 2411", - "display_name": "Mistral: Pixtral Large 2411", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2024-11-19", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2, - "output": 6 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "mistralai/devstral-2512", - "name": "Mistral: Devstral 2 2512", - "display_name": "Mistral: Devstral 2 2512", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -57364,196 +59378,310 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-09-12", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.025 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Mistral: Codestral 2508", - "display_name": "Mistral: Codestral 2508", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 51200 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", - "cost": { - "input": 0.3, - "output": 0.9 + "supported": true, + "default": true }, - "type": "chat" + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 1.75, + "output": 14 + }, + "type": "chat" }, { - "id": "mistralai/mistral-small-24b-instruct-2501", - "name": "Mistral: Mistral Small 3", - "display_name": "Mistral: Mistral Small 3", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-01-10", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.05, - "output": 0.08 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2411", - "name": "Mistral Large 2411", - "display_name": "Mistral Large 2411", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2024-11-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 2, - "output": 6 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x22b-instruct", - "name": "Mistral: Mixtral 8x22B Instruct", - "display_name": "Mistral: Mixtral 8x22B Instruct", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 13108 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { "input": 2, - "output": 6 + "output": 8 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2407", - "name": "Mistral Large 2407", - "display_name": "Mistral Large 2407", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-19", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 2, - "output": 6 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "mistralai/ministral-8b-2512", - "name": "Mistral: Ministral 3 8B 2512", - "display_name": "Mistral: Ministral 3 8B 2512", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 2000000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -57561,149 +59689,181 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3.1", - "name": "Mistral: Mistral Medium 3.1", - "display_name": "Mistral: Mistral Medium 3.1", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo Preview", + "display_name": "Kimi K2 Turbo Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.4, - "output": 2 + "input": 0.15, + "output": 8 }, "type": "chat" }, { - "id": "mistralai/mistral-small-2603", - "name": "Mistral: Mistral Small 4", - "display_name": "Mistral: Mistral Small 4", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-04-11", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.015 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "mistralai/ministral-3b-2512", - "name": "Mistral: Ministral 3 3B 2512", - "display_name": "Mistral: Ministral 3 3B 2512", + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat Latest", + "display_name": "GPT-5.3 Chat Latest", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "mistralai/voxtral-small-24b-2507", - "name": "Mistral: Voxtral Small 24B 2507", - "display_name": "Mistral: Voxtral Small 24B 2507", + "id": "deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 6400 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.1, - "output": 0.3 + "input": 3, + "output": 7 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x7b-instruct", - "name": "Mistral: Mixtral 8x7B Instruct", - "display_name": "Mistral: Mixtral 8x7B Instruct", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -57713,93 +59873,104 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2023-12-10", - "last_updated": "2026-03-15", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.54, - "output": 0.54 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3", - "name": "Mistral: Mistral Medium 3", - "display_name": "Mistral: Mistral Medium 3", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 0.4, - "output": 2 + "input": 0.27, + "output": 0.4 }, "type": "chat" }, { - "id": "mistralai/mistral-small-3.2-24b-instruct", - "name": "Mistral: Mistral Small 3.2 24B", - "display_name": "Mistral: Mistral Small 3.2 24B", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": true, - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.06, - "output": 0.18, - "cache_read": 0.03 + "input": 0.08, + "output": 0.44 }, "type": "chat" }, { - "id": "mistralai/devstral-small", - "name": "Mistral: Devstral Small 1.1", - "display_name": "Mistral: Devstral Small 1.1", + "id": "zai-org/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -57809,28 +59980,33 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2025-05-07", - "last_updated": "2025-07-10", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "mistralai/mistral-large", - "name": "Mistral Large", - "display_name": "Mistral Large", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -57841,27 +60017,28 @@ }, "limit": { "context": 128000, - "output": 25600 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2025-12-02", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2, - "output": 6 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct-v0.1", - "name": "Mistral: Mistral 7B Instruct v0.1", - "display_name": "Mistral: Mistral 7B Instruct v0.1", + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -57871,60 +60048,82 @@ ] }, "limit": { - "context": 2824, - "output": 565 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", + "open_weights": true, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.11, - "output": 0.19 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "mistralai/ministral-14b-2512", - "name": "Mistral: Ministral 3 14B 2512", - "display_name": "Mistral: Ministral 3 14B 2512", + "id": "zai-org/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Meta: Llama 3.3 70B Instruct", - "display_name": "Meta: Llama 3.3 70B Instruct", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -57934,60 +60133,60 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2026-02-04", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.1, - "output": 0.32 + "input": 0.55, + "output": 1.66 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout", - "name": "Meta: Llama 4 Scout", - "display_name": "Meta: Llama 4 Scout", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 327680, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0.02, + "output": 0.05 }, "type": "chat" }, { - "id": "meta-llama/llama-guard-3-8b", - "name": "Llama Guard 3 8B", - "display_name": "Llama Guard 3 8B", + "id": "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", + "name": "Llama 3.1 405B Instruct Turbo", + "display_name": "Llama 3.1 405B Instruct Turbo", "modalities": { "input": [ "text" @@ -57997,28 +60196,28 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-04-18", - "last_updated": "2026-02-04", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.02, - "output": 0.06 + "input": 3.5, + "output": 3.5 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick", - "name": "Meta: Llama 4 Maverick", - "display_name": "Meta: Llama 4 Maverick", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ "text", @@ -58029,8 +60228,8 @@ ] }, "limit": { - "context": 1048576, - "output": 16384 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -58039,53 +60238,64 @@ }, "attachment": true, "open_weights": true, + "knowledge": "2024-08", "release_date": "2025-04-05", - "last_updated": "2025-12-24", + "last_updated": "2025-04-05", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.14, + "output": 0.59 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-11b-vision-instruct", - "name": "Meta: Llama 3.2 11B Vision Instruct", - "display_name": "Meta: Llama 3.2 11B Vision Instruct", + "id": "Qwen/Qwen3-32B", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.049, - "output": 0.049 + "input": 0.09, + "output": 0.29 }, "type": "chat" }, { - "id": "meta-llama/llama-guard-4-12b", - "name": "Meta: Llama Guard 4 12B", - "display_name": "Meta: Llama Guard 4 12B", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct", + "display_name": "Qwen3 235B A22B Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -58093,28 +60303,29 @@ ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 262144, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-70b-instruct", - "name": "Meta: Llama 3.1 70B Instruct", - "display_name": "Meta: Llama 3.1 70B Instruct", + "id": "Qwen/QwQ-32B", + "name": "QwQ 32B", + "display_name": "QwQ 32B", "modalities": { "input": [ "text" @@ -58124,18 +60335,30 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-23", + "release_date": "2024-11-28", + "last_updated": "2024-11-28", "cost": { "input": 0.4, "output": 0.4 @@ -58143,9 +60366,9 @@ "type": "chat" }, { - "id": "meta-llama/llama-3.2-1b-instruct", - "name": "Meta: Llama 3.2 1B Instruct", - "display_name": "Meta: Llama 3.2 1B Instruct", + "id": "Qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -58155,28 +60378,29 @@ ] }, "limit": { - "context": 60000, - "output": 12000 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2026-01-27", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.027, - "output": 0.2 + "input": 0.29, + "output": 1.2 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Meta: Llama 3.2 3B Instruct", - "display_name": "Meta: Llama 3.2 3B Instruct", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", "modalities": { "input": [ "text" @@ -58186,90 +60410,102 @@ ] }, "limit": { - "context": 80000, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2026-03-15", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.051, - "output": 0.34 + "input": 0.11, + "output": 0.38 }, "type": "chat" - }, + } + ] + }, + "privatemode-ai": { + "id": "privatemode-ai", + "name": "Privatemode AI", + "display_name": "Privatemode AI", + "api": "http://localhost:8080/v1", + "doc": "https://docs.privatemode.ai/api/overview", + "models": [ { - "id": "meta-llama/llama-3-8b-instruct", - "name": "Meta: Llama 3 8B Instruct", - "display_name": "Meta: Llama 3 8B Instruct", + "id": "gemma-3-27b", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2025-04-03", + "knowledge": "2024-08", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.03, - "output": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Meta: Llama 3.1 8B Instruct", - "display_name": "Meta: Llama 3.1 8B Instruct", + "id": "whisper-large-v3", + "name": "Whisper large-v3", + "display_name": "Whisper large-v3", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 8192, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2025-12-23", + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2023-09-01", "cost": { - "input": 0.02, - "output": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-3-70b-instruct", - "name": "Meta: Llama 3 70B Instruct", - "display_name": "Meta: Llama 3 70B Instruct", + "id": "qwen3-embedding-4b", + "name": "Qwen3-Embedding 4B", + "display_name": "Qwen3-Embedding 4B", "modalities": { "input": [ "text" @@ -58279,8 +60515,8 @@ ] }, "limit": { - "context": 8192, - "output": 8000 + "context": 32000, + "output": 2560 }, "temperature": true, "tool_call": false, @@ -58289,22 +60525,21 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-06", + "release_date": "2025-06-06", + "last_updated": "2025-06-06", "cost": { - "input": 0.51, - "output": 0.74 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "x-ai/grok-4.20", - "name": "xAI: Grok 4.20", - "display_name": "xAI: Grok 4.20", + "id": "qwen3-coder-30b-a3b", + "name": "Qwen3-Coder 30B-A3B", + "display_name": "Qwen3-Coder 30B-A3B", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -58312,30 +60547,29 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-31", - "last_updated": "2026-04-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1:optimized:free", - "name": "xAI: Grok Code Fast 1 Optimized (experimental, free)", - "display_name": "xAI: Grok Code Fast 1 Optimized (experimental, free)", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -58345,8 +60579,8 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -58354,33 +60588,46 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-27", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", "cost": { "input": 0, "output": 0 }, "type": "chat" - }, + } + ] + }, + "minimax-cn-coding-plan": { + "id": "minimax-cn-coding-plan", + "name": "MiniMax Token Plan (minimaxi.com)", + "display_name": "MiniMax Token Plan (minimaxi.com)", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/token-plan/intro", + "models": [ { - "id": "x-ai/grok-4.3", - "name": "xAI: Grok 4.3", - "display_name": "xAI: Grok 4.3", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -58393,33 +60640,31 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "xAI: Grok 4 Fast", - "display_name": "xAI: Grok 4 Fast", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -58427,21 +60672,33 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -58451,8 +60708,8 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -58466,20 +60723,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "x-ai/grok-3-beta", - "name": "xAI: Grok 3 Beta", - "display_name": "xAI: Grok 3 Beta", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -58489,32 +60747,44 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -58522,8 +60792,8 @@ ] }, "limit": { - "context": 256000, - "output": 51200 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -58536,21 +60806,22 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "x-ai/grok-3-mini", - "name": "xAI: Grok 3 Mini", - "display_name": "xAI: Grok 3 Mini", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -58560,8 +60831,8 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -58569,66 +60840,78 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "xiaomi-token-plan-ams": { + "id": "xiaomi-token-plan-ams", + "name": "Xiaomi Token Plan (Europe)", + "display_name": "Xiaomi Token Plan (Europe)", + "api": "https://token-plan-ams.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ { - "id": "x-ai/grok-4.1-fast", - "name": "xAI: Grok 4.1 Fast", - "display_name": "xAI: Grok 4.1 Fast", + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 8192, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "x-ai/grok-3-mini-beta", - "name": "xAI: Grok 3 Mini Beta", - "display_name": "xAI: Grok 3 Mini Beta", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -58636,25 +60919,35 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "x-ai/grok-4.20-multi-agent", - "name": "xAI: Grok 4.20 Multi-Agent", - "display_name": "xAI: Grok 4.20 Multi-Agent", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -58662,30 +60955,42 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 1048576, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-03-31", - "last_updated": "2026-04-11", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "x-ai/grok-3", - "name": "xAI: Grok 3", - "display_name": "xAI: Grok 3", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -58695,29 +61000,42 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "tencent/hy3-preview:free", - "name": "Tencent: Hy3 Preview (free)", - "display_name": "Tencent: Hy3 Preview (free)", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -58727,8 +61045,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -58736,52 +61054,91 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, + "open_weights": true, + "knowledge": "2024-12", "release_date": "2026-04-22", - "last_updated": "2026-05-01", + "last_updated": "2026-04-22", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "tencent/hunyuan-a13b-instruct", - "name": "Tencent: Hunyuan A13B Instruct", - "display_name": "Tencent: Hunyuan A13B Instruct", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 262144, "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" - }, + } + ] + }, + "cloudferro-sherlock": { + "id": "cloudferro-sherlock", + "name": "CloudFerro Sherlock", + "display_name": "CloudFerro Sherlock", + "api": "https://api-sherlock.cloudferro.com/openai/v1/", + "doc": "https://docs.sherlock.cloudferro.com/", + "models": [ { - "id": "gryphe/mythomax-l2-13b", - "name": "MythoMax 13B", - "display_name": "MythoMax 13B", + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ "text" @@ -58791,28 +61148,34 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.06, - "output": 0.06 + "input": 2.92, + "output": 2.92 }, "type": "chat" }, { - "id": "sao10k/l3-euryale-70b", - "name": "Sao10k: Llama 3 Euryale 70B v2.1", - "display_name": "Sao10k: Llama 3 Euryale 70B v2.1", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -58822,8 +61185,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 70000, + "output": 70000 }, "temperature": true, "tool_call": true, @@ -58832,18 +61195,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-06-18", - "last_updated": "2026-03-15", + "knowledge": "2024-10-09", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.48, - "output": 1.48 + "input": 2.92, + "output": 2.92 }, "type": "chat" }, { - "id": "sao10k/l3-lunaris-8b", - "name": "Sao10K: Llama 3 8B Lunaris", - "display_name": "Sao10K: Llama 3 8B Lunaris", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -58853,28 +61217,35 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 196000, + "output": 16000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-08-13", - "last_updated": "2026-03-15", + "knowledge": "2026-01", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.04, - "output": 0.05 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "sao10k/l3.3-euryale-70b", - "name": "Sao10K: Llama 3.3 Euryale 70B", - "display_name": "Sao10K: Llama 3.3 Euryale 70B", + "id": "speakleash/Bielik-11B-v2.6-Instruct", + "name": "Bielik 11B v2.6 Instruct", + "display_name": "Bielik 11B v2.6 Instruct", "modalities": { "input": [ "text" @@ -58884,28 +61255,29 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-12-18", - "last_updated": "2026-03-15", + "knowledge": "2025-03", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.65, - "output": 0.75 + "input": 0.67, + "output": 0.67 }, "type": "chat" }, { - "id": "sao10k/l3.1-70b-hanami-x1", - "name": "Sao10K: Llama 3.1 70B Hanami x1", - "display_name": "Sao10K: Llama 3.1 70B Hanami x1", + "id": "speakleash/Bielik-11B-v3.0-Instruct", + "name": "Bielik 11B v3.0 Instruct", + "display_name": "Bielik 11B v3.0 Instruct", "modalities": { "input": [ "text" @@ -58915,28 +61287,37 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-01-08", - "last_updated": "2026-03-15", + "knowledge": "2025-03", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 3, - "output": 3 + "input": 0.67, + "output": 0.67 }, "type": "chat" - }, + } + ] + }, + "openai": { + "id": "openai", + "name": "OpenAI", + "display_name": "OpenAI", + "doc": "https://platform.openai.com/docs/models", + "models": [ { - "id": "sao10k/l3.1-euryale-70b", - "name": "Sao10K: Llama 3.1 Euryale 70B v2.2", - "display_name": "Sao10K: Llama 3.1 Euryale 70B v2.2", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -58946,122 +61327,150 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-08-28", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.85, - "output": 0.85 + "input": 0.13, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "WizardLM-2 8x22B", - "display_name": "WizardLM-2 8x22B", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65535, - "output": 8000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-24", - "last_updated": "2024-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.62, - "output": 0.62 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Microsoft: Phi 4 Mini Instruct", - "display_name": "Microsoft: Phi 4 Mini Instruct", + "id": "gpt-image-1-mini", + "name": "gpt-image-1-mini", + "display_name": "gpt-image-1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-17", - "last_updated": "2026-05-07", - "cost": { - "input": 0.08, - "output": 0.35, - "cache_read": 0.08 - }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-26", + "last_updated": "2025-09-26", + "type": "imageGeneration" }, { - "id": "microsoft/phi-4", - "name": "Microsoft: Phi 4", - "display_name": "Microsoft: Phi 4", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.06, - "output": 0.14 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "poolside/laguna-m.1:free", - "name": "Poolside: Laguna M.1 (free)", - "display_name": "Poolside: Laguna M.1 (free)", + "id": "gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -59071,61 +61480,78 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "poolside/laguna-xs.2:free", - "name": "Poolside: Laguna XS.2 (free)", - "display_name": "Poolside: Laguna XS.2 (free)", + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 0, - "output": 0 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "cohere/command-r7b-12-2024", - "name": "Cohere: Command R7B (12-2024)", - "display_name": "Cohere: Command R7B (12-2024)", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ "text" @@ -59136,89 +61562,135 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "cohere/command-a", - "name": "Cohere: Command A", - "display_name": "Cohere: Command A", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 2.5, - "output": 10 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Cohere: Command R+ (08-2024)", - "display_name": "Cohere: Command R+ (08-2024)", + "id": "gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2.5, + "input": 1.25, "output": 10 }, "type": "chat" }, { - "id": "cohere/command-r-08-2024", - "name": "Cohere: Command R (08-2024)", - "display_name": "Cohere: Command R (08-2024)", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -59228,320 +61700,312 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "knowledge": "2022-12", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "prime-intellect/intellect-3", - "name": "Prime Intellect: INTELLECT-3", - "display_name": "Prime Intellect: INTELLECT-3", + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-26", - "last_updated": "2026-02-04", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.2, - "output": 1.1 + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", - "name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", - "display_name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-03-16", - "last_updated": "2025-03-16", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "NVIDIA: Nemotron 3 Super", - "display_name": "NVIDIA: Nemotron 3 Super", + "id": "gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-04-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.1, - "output": 0.5, - "cache_read": 0.1 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", - "name": "NVIDIA: Nemotron 3 Nano Omni (free)", - "display_name": "NVIDIA: Nemotron 3 Nano Omni (free)", + "id": "gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", "modalities": { "input": [ "text", - "audio", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "NVIDIA: Nemotron 3 Nano 30B A3B", - "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "id": "chatgpt-image-latest", + "name": "chatgpt-image-latest", + "display_name": "chatgpt-image-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12", - "last_updated": "2026-02-04", - "cost": { - "input": 0.05, - "output": 0.2 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b:free", - "name": "NVIDIA: Nemotron 3 Super (free)", - "display_name": "NVIDIA: Nemotron 3 Super (free)", + "id": "gpt-5.3-codex-spark", + "name": "GPT-5.3 Codex Spark", + "display_name": "GPT-5.3 Codex Spark", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-12", - "last_updated": "2026-03-15", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "nvidia/nemotron-nano-9b-v2", - "name": "NVIDIA: Nemotron Nano 9B V2", - "display_name": "NVIDIA: Nemotron Nano 9B V2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 26215 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-18", - "last_updated": "2025-08-18", - "cost": { - "input": 0.04, - "output": 0.16 - }, - "type": "chat" - }, - { - "id": "nvidia/llama-3.1-nemotron-70b-instruct", - "name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", - "display_name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-10-12", - "last_updated": "2024-10-12", - "cost": { - "input": 1.2, - "output": 1.2 - }, - "type": "chat" - }, - { - "id": "inception/mercury-2", - "name": "Inception: Mercury 2", - "display_name": "Inception: Mercury 2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 50000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "OpenAI: GPT-5.1-Codex-Max", - "display_name": "OpenAI: GPT-5.1-Codex-Max", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", @@ -59559,16 +62023,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -59582,10 +62046,11 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { "input": 1.25, "output": 10, @@ -59594,14 +62059,13 @@ "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "OpenAI: GPT-5.2 Chat", - "display_name": "OpenAI: GPT-5.2 Chat", + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -59614,67 +62078,38 @@ "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", - "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4o-mini-search-preview", - "name": "OpenAI: GPT-4o-mini Search Preview", - "display_name": "OpenAI: GPT-4o-mini Search Preview", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01", - "last_updated": "2025-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "OpenAI: GPT-5 Chat", - "display_name": "OpenAI: GPT-5 Chat", + "id": "gpt-image-1.5", + "name": "gpt-image-1.5", + "display_name": "gpt-image-1.5", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": false, "tool_call": false, @@ -59683,32 +62118,27 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "type": "imageGeneration" }, { - "id": "openai/gpt-4o-2024-05-13", - "name": "OpenAI: GPT-4o (2024-05-13)", - "display_name": "OpenAI: GPT-4o (2024-05-13)", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -59717,22 +62147,22 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 5, - "output": 15 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5.3-chat", - "name": "OpenAI: GPT-5.3 Chat", - "display_name": "OpenAI: GPT-5.3 Chat", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -59740,32 +62170,33 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8191, + "output": 1536 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-04", - "last_updated": "2026-03-15", + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 1.75, - "output": 14 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "openai/gpt-5.2-pro", - "name": "OpenAI: GPT-5.2 Pro", - "display_name": "OpenAI: GPT-5.2 Pro", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -59773,7 +62204,7 @@ }, "limit": { "context": 400000, - "output": 128000 + "output": 272000 }, "temperature": false, "tool_call": true, @@ -59785,13 +62216,8 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", + "mode": "fixed", "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], "verbosity": "medium", "verbosity_options": [ "low", @@ -59803,54 +62229,58 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 21, - "output": 168 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "openai/gpt-4-1106-preview", - "name": "OpenAI: GPT-4 Turbo (older v1106)", - "display_name": "OpenAI: GPT-4 Turbo (older v1106)", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 10, - "output": 30 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-chat-latest", - "name": "OpenAI: GPT Chat Latest", - "display_name": "OpenAI: GPT Chat Latest", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -59864,73 +62294,56 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-05", - "last_updated": "2026-05-07", - "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4o-audio-preview", - "name": "OpenAI: GPT-4o Audio", - "display_name": "OpenAI: GPT-4o Audio", - "modalities": { - "input": [ - "audio", - "text" - ], - "output": [ - "audio", - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.5, - "output": 10 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "OpenAI: GPT-5.5", - "display_name": "OpenAI: GPT-5.5", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -59946,10 +62359,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -59962,50 +62375,52 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "OpenAI: GPT-5 Mini", - "display_name": "OpenAI: GPT-5 Mini", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -60018,32 +62433,83 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "OpenAI: GPT-5 Nano", - "display_name": "OpenAI: GPT-5 Nano", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ + "text", "image", - "pdf", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "type": "chat" + }, + { + "id": "o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -60058,13 +62524,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -60074,23 +62533,56 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 150, + "output": 600 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "OpenAI: GPT-5.3-Codex", - "display_name": "OpenAI: GPT-5.3-Codex", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "image", + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 10, + "output": 30 + }, + "type": "chat" + }, + { + "id": "gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" @@ -60100,18 +62592,20 @@ "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high", @@ -60128,86 +62622,74 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-25", - "last_updated": "2026-03-15", - "cost": { - "input": 1.75, - "output": 14 - }, - "type": "chat" - }, - { - "id": "openai/gpt-3.5-turbo-16k", - "name": "OpenAI: GPT-3.5 Turbo 16k", - "display_name": "OpenAI: GPT-3.5 Turbo 16k", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16385, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2023-08-28", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 3, - "output": 4 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "OpenAI: GPT-4 Turbo", - "display_name": "OpenAI: GPT-4 Turbo", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2024-04-09", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 10, - "output": 30 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "OpenAI: GPT-5.2", - "display_name": "OpenAI: GPT-5.2", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -60233,8 +62715,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -60247,32 +62728,33 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "OpenAI: o3 Pro", - "display_name": "OpenAI: o3 Pro", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -60287,6 +62769,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -60296,30 +62785,48 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 20, - "output": 80 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "OpenAI: o3 Mini High", - "display_name": "OpenAI: o3 Mini High", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -60332,8 +62839,14 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -60343,24 +62856,37 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "OpenAI: GPT-4o-mini", - "display_name": "OpenAI: GPT-4o-mini", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -60370,31 +62896,32 @@ "context": 128000, "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "OpenAI: o4 Mini Deep Research", - "display_name": "OpenAI: o4 Mini Deep Research", + "id": "o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -60404,7 +62931,7 @@ "context": 200000, "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -60426,8 +62953,9 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-05", "release_date": "2024-06-26", - "last_updated": "2026-03-15", + "last_updated": "2024-06-26", "cost": { "input": 2, "output": 8, @@ -60436,70 +62964,45 @@ "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "OpenAI: GPT-5.4 Mini", - "display_name": "OpenAI: GPT-5.4 Mini", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-04-11", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "OpenAI: GPT-5.1 Chat", - "display_name": "OpenAI: GPT-5.1 Chat", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60507,34 +63010,33 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2026-03-15", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI: o4 Mini", - "display_name": "OpenAI: o4 Mini", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -60566,24 +63068,24 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-05", "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "last_updated": "2025-04-16", "cost": { "input": 1.1, "output": 4.4, - "cache_read": 0.275 + "cache_read": 0.28 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "OpenAI: GPT-5.4 Nano", - "display_name": "OpenAI: GPT-5.4 Nano", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -60609,8 +63111,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -60623,19 +63124,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-04-11", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "OpenAI: GPT-5.2-Codex", - "display_name": "OpenAI: GPT-5.2-Codex", + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ "text", @@ -60645,6 +63147,41 @@ "text" ] }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, "limit": { "context": 400000, "output": 128000 @@ -60678,8 +63215,9 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { "input": 1.75, "output": 14, @@ -60688,46 +63226,41 @@ "type": "chat" }, { - "id": "openai/gpt-4o-mini-2024-07-18", - "name": "OpenAI: GPT-4o-mini (2024-07-18)", - "display_name": "OpenAI: GPT-4o-mini (2024-07-18)", + "id": "gpt-image-1", + "name": "gpt-image-1", + "display_name": "gpt-image-1", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2026-03-15", - "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "release_date": "2025-04-24", + "last_updated": "2025-04-24", + "type": "imageGeneration" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "OpenAI: GPT-5.1-Codex-Mini", - "display_name": "OpenAI: GPT-5.1-Codex-Mini", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" @@ -60735,22 +63268,22 @@ }, "limit": { "context": 400000, - "output": 100000 + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -60766,9 +63299,10 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", - "cost": { + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { "input": 0.25, "output": 2, "cache_read": 0.025 @@ -60776,138 +63310,11 @@ "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "OpenAI: GPT-4o (2024-08-06)", - "display_name": "OpenAI: GPT-4o (2024-08-06)", - "modalities": { - "input": [ - "image", - "pdf", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-06", - "last_updated": "2026-03-15", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5-image", - "name": "OpenAI: GPT-5 Image", - "display_name": "OpenAI: GPT-5 Image", - "modalities": { - "input": [ - "image", - "pdf", - "text" - ], - "output": [ - "image", - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-14", - "last_updated": "2026-03-15", - "cost": { - "input": 10, - "output": 10 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5.1", - "name": "OpenAI: GPT-5.1", - "display_name": "OpenAI: GPT-5.1", - "modalities": { - "input": [ - "image", - "pdf", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2026-03-15", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "openai/o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -60938,35 +63345,37 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-05", - "last_updated": "2026-03-15", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "OpenAI: GPT-5.4 Pro", - "display_name": "OpenAI: GPT-5.4 Pro", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -60977,8 +63386,9 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ + "low", "medium", "high", "xhigh" @@ -60994,54 +63404,59 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 30, - "output": 180 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "OpenAI: GPT-3.5 Turbo", - "display_name": "OpenAI: GPT-3.5 Turbo", + "id": "gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 0.5, - "output": 1.5 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "OpenAI: o3 Deep Research", - "display_name": "OpenAI: o3 Deep Research", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" @@ -61051,7 +63466,7 @@ "context": 200000, "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -61073,22 +63488,22 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-06-26", - "last_updated": "2026-03-15", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI: o3 Mini", - "display_name": "OpenAI: o3 Mini", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ - "pdf", "text" ], "output": [ @@ -61096,11 +63511,11 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 65536 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -61119,10 +63534,11 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-20", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { "input": 1.1, "output": 4.4, @@ -61131,45 +63547,13 @@ "type": "chat" }, { - "id": "openai/gpt-4-turbo-preview", - "name": "OpenAI: GPT-4 Turbo Preview", - "display_name": "OpenAI: GPT-4 Turbo Preview", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2026-03-15", - "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" - }, - { - "id": "openai/o1-pro", - "name": "OpenAI: o1-pro", - "display_name": "OpenAI: o1-pro", + "id": "o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -61180,7 +63564,7 @@ "output": 100000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -61201,51 +63585,50 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-03-19", - "last_updated": "2026-03-15", + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "cost": { - "input": 150, - "output": 600 + "input": 10, + "output": 40, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "openai/gpt-5.4-image-2", - "name": "OpenAI: GPT-5.4 Image 2", - "display_name": "OpenAI: GPT-5.4 Image 2", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "image", "text", - "pdf" + "image" ], "output": [ - "image", "text" ] }, "limit": { - "context": 272000, + "context": 400000, "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -61258,140 +63641,134 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 8, - "output": 15, - "cache_read": 2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "OpenAI: GPT-4", - "display_name": "OpenAI: GPT-4", + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-03-14", - "last_updated": "2024-04-09", + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 30, - "output": 60 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/gpt-4-0314", - "name": "OpenAI: GPT-4 (older v0314)", - "display_name": "OpenAI: GPT-4 (older v0314)", + "id": "gpt-image-2", + "name": "gpt-image-2", + "display_name": "gpt-image-2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8191, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-05-28", - "last_updated": "2026-03-15", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 30, - "output": 60 + "input": 5, + "output": 30, + "cache_read": 1.25 }, - "type": "chat" - }, + "type": "imageGeneration" + } + ] + }, + "dinference": { + "id": "dinference", + "name": "DInference", + "display_name": "DInference", + "api": "https://api.dinference.com/v1", + "doc": "https://dinference.com", + "models": [ { - "id": "openai/gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-08", + "last_updated": "2025-08", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.0675, + "output": 0.27 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "OpenAI: GPT-5.4", - "display_name": "OpenAI: GPT-5.4", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -61399,117 +63776,79 @@ ] }, "limit": { - "context": 1050000, + "context": 200000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-15", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 2.5, - "output": 15 + "input": 1.25, + "output": 3.89 }, "type": "chat" }, { - "id": "openai/gpt-audio", - "name": "OpenAI: GPT Audio", - "display_name": "OpenAI: GPT Audio", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "audio", "text" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-01-20", - "last_updated": "2026-03-15", - "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4o-search-preview", - "name": "OpenAI: GPT-4o Search Preview", - "display_name": "OpenAI: GPT-4o Search Preview", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 + "supported": true, + "default": true }, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-13", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2.5, - "output": 10 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "OpenAI: GPT-4.1 Nano", - "display_name": "OpenAI: GPT-4.1 Nano", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -61517,33 +63856,43 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.45, + "output": 1.65 }, "type": "chat" }, { - "id": "openai/o4-mini-high", - "name": "OpenAI: o4 Mini High", - "display_name": "OpenAI: o4 Mini High", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -61552,8 +63901,9 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -61562,58 +63912,72 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.75, + "output": 2.4 }, "type": "chat" - }, + } + ] + }, + "vivgrid": { + "id": "vivgrid", + "name": "Vivgrid", + "display_name": "Vivgrid", + "api": "https://api.vivgrid.com/v1", + "doc": "https://docs.vivgrid.com/models", + "models": [ { - "id": "openai/o3", - "name": "OpenAI: o3", - "display_name": "OpenAI: o3", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -61623,19 +63987,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: gpt-oss-20b", - "display_name": "OpenAI: gpt-oss-20b", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -61645,8 +64010,8 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -61661,23 +64026,24 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.03, - "output": 0.14 + "input": 0.28, + "output": 0.42 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - "display_name": "OpenAI: GPT-5 Pro", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" @@ -61691,14 +64057,21 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -61710,124 +64083,199 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 15, - "output": 120 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "openai/gpt-audio-mini", - "name": "OpenAI: GPT Audio Mini", - "display_name": "OpenAI: GPT Audio Mini", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - "audio", - "text" + "text", + "image", + "pdf" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-01-20", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.6, - "output": 2.4 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "OpenAI: GPT-4o", - "display_name": "OpenAI: GPT-4o", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "cache_write": 1 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-0613", - "name": "OpenAI: GPT-3.5 Turbo (older v0613)", - "display_name": "OpenAI: GPT-3.5 Turbo (older v0613)", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4095, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 1, - "output": 2 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "openai/gpt-5-image-mini", - "name": "OpenAI: GPT-5 Image Mini", - "display_name": "OpenAI: GPT-5 Image Mini", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ - "image", "text" ] }, @@ -61835,31 +64283,53 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-10-16", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.5, - "output": 2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "OpenAI: GPT-5", - "display_name": "OpenAI: GPT-5", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -61873,16 +64343,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", "high" @@ -61896,10 +64366,11 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { "input": 1.25, "output": 10, @@ -61908,55 +64379,79 @@ "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "OpenAI: gpt-oss-safeguard-20b", - "display_name": "OpenAI: gpt-oss-safeguard-20b", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.037 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI: gpt-oss-120b", - "display_name": "OpenAI: gpt-oss-120b", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -61964,35 +64459,52 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.039, - "output": 0.19 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "OpenAI: GPT-5.5 Pro", - "display_name": "OpenAI: GPT-5.5 Pro", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -62001,55 +64513,45 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", - "cost": { - "input": 30, - "output": 180 - }, - "type": "chat" - }, - { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "OpenAI: GPT-3.5 Turbo Instruct", - "display_name": "OpenAI: GPT-3.5 Turbo Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 4095, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2023-03-01", - "last_updated": "2023-09-21", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 1.5, - "output": 2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "OpenAI: GPT-4.1", - "display_name": "OpenAI: GPT-4.1", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -62057,93 +64559,73 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4.1-mini", - "name": "OpenAI: GPT-4.1 Mini", - "display_name": "OpenAI: GPT-4.1 Mini", - "modalities": { - "input": [ - "image", - "pdf", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "OpenAI: GPT-5.1-Codex", - "display_name": "OpenAI: GPT-5.1-Codex", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -62156,23 +64638,46 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" - }, + } + ] + }, + "cerebras": { + "id": "cerebras", + "name": "Cerebras", + "display_name": "Cerebras", + "doc": "https://inference-docs.cerebras.ai/models/overview", + "models": [ { - "id": "openai/gpt-4o-2024-11-20", - "name": "OpenAI: GPT-4o (2024-11-20)", - "display_name": "OpenAI: GPT-4o (2024-11-20)", + "id": "zai-glm-4.7", + "name": "Z.AI GLM-4.7", + "display_name": "Z.AI GLM-4.7", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -62180,32 +64685,32 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 40000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-11-20", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-10", + "last_updated": "2026-01-10", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 2.25, + "output": 2.75, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "amazon/nova-lite-v1", - "name": "Amazon: Nova Lite 1.0", - "display_name": "Amazon: Nova Lite 1.0", + "id": "qwen-3-235b-a22b-instruct-2507", + "name": "Qwen 3 235B Instruct", + "display_name": "Qwen 3 235B Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -62213,63 +64718,68 @@ ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 131000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.06, - "output": 0.24 + "input": 0.6, + "output": 1.2 }, "type": "chat" }, { - "id": "amazon/nova-pro-v1", - "name": "Amazon: Nova Pro 1.0", - "display_name": "Amazon: Nova Pro 1.0", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.8, - "output": 3.2 + "input": 0.25, + "output": 0.69 }, "type": "chat" }, { - "id": "amazon/nova-premier-v1", - "name": "Amazon: Nova Premier 1.0", - "display_name": "Amazon: Nova Premier 1.0", + "id": "llama3.1-8b", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -62277,8 +64787,49 @@ ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 32000, + "output": 8000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "chat" + } + ] + }, + "cloudflare-ai-gateway": { + "id": "cloudflare-ai-gateway", + "name": "Cloudflare AI Gateway", + "display_name": "Cloudflare AI Gateway", + "doc": "https://developers.cloudflare.com/ai-gateway/", + "models": [ + { + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -62287,53 +64838,77 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { "input": 2.5, - "output": 12.5 + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "amazon/nova-2-lite-v1", - "name": "Amazon: Nova 2 Lite", - "display_name": "Amazon: Nova 2 Lite", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65535 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.3, - "output": 2.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "amazon/nova-micro-v1", - "name": "Amazon: Nova Micro 1.0", - "display_name": "Amazon: Nova Micro 1.0", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -62343,153 +64918,196 @@ ] }, "limit": { - "context": 128000, - "output": 5120 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2026-03-15", + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.035, - "output": 0.14 + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "z-ai/glm-5v-turbo", - "name": "Z.ai: GLM 5V Turbo", - "display_name": "Z.ai: GLM 5V Turbo", + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-11", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "Z.ai: GLM 4.7", - "display_name": "Z.ai: GLM 4.7", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.38, - "output": 1.98, - "cache_read": 0.2 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "Z.ai: GLM 5", - "display_name": "Z.ai: GLM 5", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.72, - "output": 2.3 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "z-ai/glm-4-32b", - "name": "Z.ai: GLM 4 32B ", - "display_name": "Z.ai: GLM 4 32B ", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -62497,97 +65115,111 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-25", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "z-ai/glm-5.1", - "name": "Z.ai: GLM 5.1", - "display_name": "Z.ai: GLM 5.1", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1.26, - "output": 3.96 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "z-ai/glm-4.5", - "name": "Z.ai: GLM 4.5", - "display_name": "Z.ai: GLM 4.5", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.175 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "z-ai/glm-4.5-air", - "name": "Z.ai: GLM 4.5 Air", - "display_name": "Z.ai: GLM 4.5 Air", + "id": "openai/gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -62597,43 +65229,43 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.13, - "output": 0.85, - "cache_read": 0.025 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "z-ai/glm-5-turbo", - "name": "Z.ai: GLM 5 Turbo", - "display_name": "Z.ai: GLM 5 Turbo", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -62641,24 +65273,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-15", - "last_updated": "2026-04-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "z-ai/glm-4.5v", - "name": "Z.ai: GLM 4.5V", - "display_name": "Z.ai: GLM 4.5V", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", @@ -62669,43 +65311,67 @@ ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 1.8, - "cache_read": 0.11 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "Z.ai: GLM 4.6", - "display_name": "Z.ai: GLM 4.6", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -62713,71 +65379,104 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.39, - "output": 1.9, + "input": 1.75, + "output": 14, "cache_read": 0.175 }, "type": "chat" }, { - "id": "z-ai/glm-4.6v", - "name": "Z.ai: GLM 4.6V", - "display_name": "Z.ai: GLM 4.6V", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2026-01-10", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.3, - "output": 0.9 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "z-ai/glm-4.7-flash", - "name": "Z.ai: GLM 4.7 Flash", - "display_name": "Z.ai: GLM 4.7 Flash", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 40551 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -62785,465 +65484,617 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.06, - "output": 0.4, - "cache_read": 0.01 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "Baidu: ERNIE 4.5 VL 424B A47B ", - "display_name": "Baidu: ERNIE 4.5 VL 424B A47B ", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 123000, - "output": 16000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2026-01", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.42, - "output": 1.25 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "baidu/qianfan-ocr-fast:free", - "name": "Baidu: Qianfan-OCR-Fast (free)", - "display_name": "Baidu: Qianfan-OCR-Fast (free)", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 28672 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-05-01", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "baidu/cobuddy:free", - "name": "Baidu: CoBuddy (free)", - "display_name": "Baidu: CoBuddy (free)", - "modalities": { - "input": [ - "text" + "id": "anthropic/claude-3-sonnet", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-06", - "last_updated": "2026-05-07", + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "Baidu: ERNIE 4.5 VL 28B A3B", - "display_name": "Baidu: ERNIE 4.5 VL 28B A3B", + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 30000, - "output": 8000 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.14, - "output": 0.56 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21b-a3b", - "name": "Baidu: ERNIE 4.5 21B A3B", - "display_name": "Baidu: ERNIE 4.5 21B A3B", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 8000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.07, - "output": 0.28 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-300b-a47b", - "name": "Baidu: ERNIE 4.5 300B A47B ", - "display_name": "Baidu: ERNIE 4.5 300B A47B ", + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 123000, - "output": 12000 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2026-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.28, - "output": 1.1 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21b-a3b-thinking", - "name": "Baidu: ERNIE 4.5 21B A3B Thinking", - "display_name": "Baidu: ERNIE 4.5 21B A3B Thinking", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.07, - "output": 0.28 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "relace/relace-apply-3", - "name": "Relace: Relace Apply 3", - "display_name": "Relace: Relace Apply 3", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.85, - "output": 1.25 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "relace/relace-search", - "name": "Relace: Relace Search", - "display_name": "Relace: Relace Search", + "id": "anthropic/claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2026-03-15", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 3 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax: MiniMax M2.7", - "display_name": "MiniMax: MiniMax M2.7", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax: MiniMax M2", - "display_name": "MiniMax: MiniMax M2", + "id": "anthropic/claude-3-opus", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-23", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.255, - "output": 1, - "cache_read": 0.03 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "minimax/minimax-01", - "name": "MiniMax: MiniMax-01", - "display_name": "MiniMax: MiniMax-01", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000192, - "output": 1000192 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 1.1 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax: MiniMax M2.1", - "display_name": "MiniMax: MiniMax M2.1", + "id": "anthropic/claude-3-5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 39322 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.27, - "output": 0.95, - "cache_read": 0.03 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "minimax/minimax-m1", - "name": "MiniMax: MiniMax M1", - "display_name": "MiniMax: MiniMax M1", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6 (latest)", + "display_name": "Claude Opus 4.6 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -63251,70 +66102,124 @@ }, "limit": { "context": 1000000, - "output": 40000 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.4, - "output": 2.2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "minimax/minimax-m2-her", - "name": "MiniMax: MiniMax M2-her", - "display_name": "MiniMax: MiniMax M2-her", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 2048 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-23", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax: MiniMax M2.5", - "display_name": "MiniMax: MiniMax M2.5", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -63327,34 +66232,38 @@ "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.25, - "output": 1.2, - "cache_read": 0.029 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b", - "name": "Qwen: Qwen3 235B A22B", - "display_name": "Qwen: Qwen3 235B A22B", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -63363,48 +66272,81 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.455, - "output": 1.82, - "cache_read": 0.15 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" - }, + } + ] + }, + "vultr": { + "id": "vultr", + "name": "Vultr", + "display_name": "Vultr", + "api": "https://api.vultrinference.com/v1", + "doc": "https://api.vultrinference.com/", + "models": [ { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen: Qwen3.5-122B-A10B", - "display_name": "Qwen: Qwen3.5-122B-A10B", + "id": "Kimi-K2.5", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 254000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -63417,20 +66359,21 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.26, - "output": 2.08 + "input": 0.55, + "output": 2.75 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-plus", - "name": "Qwen: Qwen3 Coder Plus", - "display_name": "Qwen: Qwen3 Coder Plus", + "id": "DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -63440,119 +66383,108 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 127000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2026-03-15", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.65, - "output": 3.25, - "cache_read": 0.2 + "input": 0.55, + "output": 1.65 }, "type": "chat" }, { - "id": "qwen/qwen3.6-27b", - "name": "Qwen: Qwen3.6 27B", - "display_name": "Qwen: Qwen3.6 27B", + "id": "MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 194000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2025-02-11", + "last_updated": "2025-02-11", "cost": { - "input": 0.325, - "output": 3.25 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen/qwen3.5-27b", - "name": "Qwen: Qwen3.5-27B", - "display_name": "Qwen: Qwen3.5-27B", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 129000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2024-06", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.195, - "output": 1.56 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-2507", - "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", + "id": "GLM-5-FP8", + "name": "GLM 5 FP8", + "display_name": "GLM 5 FP8", "modalities": { "input": [ "text" @@ -63562,29 +66494,38 @@ ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-01", + "knowledge": "2025-05", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.071, - "output": 0.1 + "input": 0.85, + "output": 3.1 }, "type": "chat" - }, + } + ] + }, + "kuae-cloud-coding-plan": { + "id": "kuae-cloud-coding-plan", + "name": "KUAE Cloud Coding Plan", + "display_name": "KUAE Cloud Coding Plan", + "api": "https://coding-plan-endpoint.kuaecloud.net/v1", + "doc": "https://docs.mthreads.com/kuaecloud/kuaecloud-doc-online/coding_plan/", + "models": [ { - "id": "qwen/qwen3-8b", - "name": "Qwen: Qwen3 8B", - "display_name": "Qwen: Qwen3 8B", + "id": "GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -63594,8 +66535,8 @@ ] }, "limit": { - "context": 40960, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -63616,32 +66557,41 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.05 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "modelscope": { + "id": "modelscope", + "name": "ModelScope", + "display_name": "ModelScope", + "api": "https://api-inference.modelscope.cn/v1", + "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", + "models": [ { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen: Qwen3.5 397B A17B", - "display_name": "Qwen: Qwen3.5 397B A17B", + "id": "ZhipuAI/GLM-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -63649,34 +66599,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.39, - "output": 2.34 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen-vl-plus", - "name": "Qwen: Qwen VL Plus", - "display_name": "Qwen: Qwen VL Plus", + "id": "ZhipuAI/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -63684,29 +66623,35 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.1365, - "output": 0.4095, - "cache_read": 0.042 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-32b", - "name": "Qwen: Qwen3 32B", - "display_name": "Qwen: Qwen3 32B", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -63716,8 +66661,8 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -63738,22 +66683,21 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen: Qwen2.5 VL 72B Instruct", - "display_name": "Qwen: Qwen2.5 VL 72B Instruct", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -63761,29 +66705,29 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262144, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-02-01", - "last_updated": "2026-03-15", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.8, - "output": 0.8, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen-max", - "name": "Qwen: Qwen-Max ", - "display_name": "Qwen: Qwen-Max ", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -63793,8 +66737,8 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -63802,20 +66746,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 1.04, - "output": 4.16, - "cache_read": 0.32 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen-plus", - "name": "Qwen: Qwen-Plus", - "display_name": "Qwen: Qwen-Plus", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -63825,45 +66769,32 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "cost": { - "input": 0.4, - "output": 1.2, - "cache_read": 0.08 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3.6-35b-a3b", - "name": "Qwen: Qwen3.6 35B A3B", - "display_name": "Qwen: Qwen3.6 35B A3B", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -63871,10 +66802,10 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -63890,24 +66821,32 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.1612, - "output": 0.96525, - "cache_read": 0.1612 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "kimi-for-coding": { + "id": "kimi-for-coding", + "name": "Kimi For Coding", + "display_name": "Kimi For Coding", + "api": "https://api.kimi.com/coding/v1", + "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", + "models": [ { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen: Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -63915,7 +66854,7 @@ ] }, "limit": { - "context": 131072, + "context": 262144, "output": 32768 }, "temperature": true, @@ -63935,31 +66874,35 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2026-03-15", + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", "cost": { - "input": 0.26, - "output": 2.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "Qwen: Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", + "id": "k2p6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ + "text", "image", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 262144, "output": 32768 }, "temperature": true, @@ -63968,111 +66911,104 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-10-11", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2026-04", + "last_updated": "2026-04", "cost": { - "input": 0.13, - "output": 1.56 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-instruct", - "name": "Qwen: Qwen3 VL 8B Instruct", - "display_name": "Qwen: Qwen3 VL 8B Instruct", + "id": "k2p5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ + "text", "image", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 262144, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.08, - "output": 0.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "lucidquery": { + "id": "lucidquery", + "name": "LucidQuery AI", + "display_name": "LucidQuery AI", + "api": "https://lucidquery.com/api/v1", + "doc": "https://lucidquery.com/api/docs", + "models": [ { - "id": "qwen/qwen3.5-flash-02-23", - "name": "Qwen: Qwen3.5-Flash", - "display_name": "Qwen: Qwen3.5-Flash", + "id": "lucidquery-nexus-coder", + "name": "LucidQuery Nexus Coder", + "display_name": "LucidQuery Nexus Coder", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 250000, + "output": 60000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-08-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.1, - "output": 0.4 + "input": 2, + "output": 5 }, "type": "chat" }, { - "id": "qwen/qwen3.6-plus", - "name": "Qwen: Qwen3.6 Plus", - "display_name": "Qwen: Qwen3.6 Plus", + "id": "lucidnova-rf1-100b", + "name": "LucidNova RF1 100B", + "display_name": "LucidNova RF1 100B", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -64080,42 +67016,39 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 120000, + "output": 8000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2026-04-11", + "knowledge": "2025-09-16", + "release_date": "2024-12-28", + "last_updated": "2025-09-10", "cost": { - "input": 0.325, - "output": 1.95, - "cache_read": 0.0325, - "cache_write": 0.40625 + "input": 2, + "output": 5 }, "type": "chat" - }, + } + ] + }, + "neuralwatt": { + "id": "neuralwatt", + "name": "Neuralwatt", + "display_name": "Neuralwatt", + "api": "https://api.neuralwatt.com/v1", + "doc": "https://portal.neuralwatt.com/docs", + "models": [ { - "id": "qwen/qwen3-max", - "name": "Qwen: Qwen3 Max", - "display_name": "Qwen: Qwen3 Max", + "id": "qwen3.5-397b-fast", + "name": "Qwen3.5 397B Fast", + "display_name": "Qwen3.5 397B Fast", "modalities": { "input": [ "text" @@ -64125,8 +67058,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, @@ -64145,20 +67078,19 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 0.69, + "output": 4.14 }, "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28", - "name": "Qwen: Qwen Plus 0728", - "display_name": "Qwen: Qwen Plus 0728", + "id": "glm-5-fast", + "name": "GLM 5 Fast", + "display_name": "GLM 5 Fast", "modalities": { "input": [ "text" @@ -64168,39 +67100,28 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 202736, + "output": 202736 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-09-09", - "last_updated": "2026-03-15", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.26, - "output": 0.78 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-instruct-2507", - "name": "Qwen: Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", + "id": "glm-5.1-fast", + "name": "GLM 5.1 Fast", + "display_name": "GLM 5.1 Fast", "modalities": { "input": [ "text" @@ -64210,8 +67131,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202736, + "output": 202736 }, "temperature": true, "tool_call": true, @@ -64220,19 +67141,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2026-03-15", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.09, - "output": 0.3, - "cache_read": 0.04 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-32b-instruct", - "name": "Qwen: Qwen3 VL 32B Instruct", - "display_name": "Qwen: Qwen3 VL 32B Instruct", + "id": "kimi-k2.6-fast", + "name": "Kimi K2.6 Fast", + "display_name": "Kimi K2.6 Fast", "modalities": { "input": [ "text", @@ -64243,8 +67163,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, @@ -64252,36 +67172,36 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.104, - "output": 0.416 + "input": 0.69, + "output": 3.22 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "id": "qwen3.6-35b-fast", + "name": "Qwen3.6 35B Fast", + "display_name": "Qwen3.6 35B Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131056, + "output": 131056 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -64294,74 +67214,64 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-07-25", - "last_updated": "2026-03-15", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.11, - "output": 0.6 + "input": 0.05, + "output": 0.1 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen: Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", + "id": "kimi-k2.5-fast", + "name": "Kimi K2.5 Fast", + "display_name": "Kimi K2.5 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-11", - "last_updated": "2026-03-15", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.0975, - "output": 0.78 + "input": 0.52, + "output": 2.59 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-thinking-2507", - "name": "Qwen: Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, @@ -64380,51 +67290,20 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2025-07-29", - "cost": { - "input": 0.051, - "output": 0.34 - }, - "type": "chat" - }, - { - "id": "qwen/qwen-2.5-7b-instruct", - "name": "Qwen: Qwen2.5 7B Instruct", - "display_name": "Qwen: Qwen2.5 7B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 6554 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-09", - "last_updated": "2025-04-16", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.04, - "output": 0.1 + "input": 0.69, + "output": 3.22 }, "type": "chat" }, { - "id": "qwen/qwen-vl-max", - "name": "Qwen: Qwen VL Max", - "display_name": "Qwen: Qwen VL Max", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -64435,28 +67314,40 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.8, - "output": 3.2 + "input": 0.52, + "output": 2.59 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-flash", - "name": "Qwen: Qwen3 Coder Flash", - "display_name": "Qwen: Qwen3 Coder Flash", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -64466,29 +67357,34 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 16368, + "output": 16368 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.195, - "output": 0.975, - "cache_read": 0.06 + "input": 0.03, + "output": 0.16 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b", - "name": "Qwen: Qwen3 30B A3B", - "display_name": "Qwen: Qwen3 30B A3B", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM 5.1 FP8", + "display_name": "GLM 5.1 FP8", "modalities": { "input": [ "text" @@ -64498,8 +67394,8 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 202736, + "output": 202736 }, "temperature": true, "tool_call": true, @@ -64520,63 +67416,61 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.08, - "output": 0.28, - "cache_read": 0.03 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", + "id": "mistralai/Devstral-Small-2-24B-Instruct-2512", + "name": "Devstral Small 2 24B Instruct 2512", + "display_name": "Devstral Small 2 24B Instruct 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 52429 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-11", - "last_updated": "2026-03-15", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.09, - "output": 1.1 + "input": 0.12, + "output": 0.35 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus-20260420", - "name": "Qwen: Qwen3.5 Plus 2026-04-20", - "display_name": "Qwen: Qwen3.5 Plus 2026-04-20", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 196592, + "output": 196592 }, "temperature": true, "tool_call": true, @@ -64595,20 +67489,20 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.4, - "output": 2.4 + "input": 0.35, + "output": 1.38 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-next", - "name": "Qwen: Qwen3 Coder Next", - "display_name": "Qwen: Qwen3 Coder Next", + "id": "Qwen/Qwen3.5-397B-A17B-FP8", + "name": "Qwen3.5 397B A17B FP8", + "display_name": "Qwen3.5 397B A17B FP8", "modalities": { "input": [ "text" @@ -64618,135 +67512,189 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 262128, + "output": 262128 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-02", - "last_updated": "2026-03-15", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.12, - "output": 0.75, - "cache_read": 0.035 + "input": 0.69, + "output": 4.14 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 131056, + "output": 131056 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2024-11-11", - "last_updated": "2026-03-15", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0.015 + "input": 0.05, + "output": 0.1 }, "type": "chat" - }, + } + ] + }, + "azure-cognitive-services": { + "id": "azure-cognitive-services", + "name": "Azure Cognitive Services", + "display_name": "Azure Cognitive Services", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "Qwen: Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "open_weights": false, + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.13, - "output": 0.52 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen: Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.07, - "output": 0.27 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen/qwen3-max-thinking", - "name": "Qwen: Qwen3 Max Thinking", - "display_name": "Qwen: Qwen3 Max Thinking", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -64756,72 +67704,107 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-23", - "last_updated": "2026-03-15", + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.78, - "output": 3.9 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen/qwen-turbo", - "name": "Qwen: Qwen-Turbo", - "display_name": "Qwen: Qwen-Turbo", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-11-01", - "last_updated": "2026-03-15", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.0325, - "output": 0.13, - "cache_read": 0.01 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -64833,73 +67816,48 @@ }, "limit": { "context": 262144, - "output": 52429 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-23", - "last_updated": "2026-01-10", - "cost": { - "input": 0.2, - "output": 0.88, - "cache_read": 0.11 - }, - "type": "chat" - }, - { - "id": "qwen/qwen3-coder", - "name": "Qwen: Qwen3 Coder 480B A35B", - "display_name": "Qwen: Qwen3 Coder 480B A35B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 52429 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } }, "attachment": false, "open_weights": true, - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-01", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.22, - "output": 1, - "cache_read": 0.022 + "input": 0.95, + "output": 4 }, "type": "chat" }, { - "id": "qwen/qwen3.5-9b", - "name": "Qwen: Qwen3.5-9B", - "display_name": "Qwen: Qwen3.5-9B", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "image", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -64909,43 +67867,40 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-10", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.05, - "output": 0.15 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-thinking", - "name": "Qwen: Qwen3 VL 8B Thinking", - "display_name": "Qwen: Qwen3 VL 8B Thinking", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -64954,39 +67909,52 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.117, - "output": 1.365 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "qwen/qwen3.6-max-preview", - "name": "Qwen: Qwen3.6 Max Preview", - "display_name": "Qwen: Qwen3.6 Max Preview", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -64996,30 +67964,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 1.04, - "output": 6.24, - "cache_write": 1.3 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28:thinking", - "name": "Qwen: Qwen Plus 0728 (thinking)", - "display_name": "Qwen: Qwen Plus 0728 (thinking)", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -65029,8 +67992,8 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -65040,49 +68003,51 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-09-09", - "last_updated": "2026-03-15", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.26, - "output": 0.78 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-09", - "last_updated": "2026-01-10", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { "input": 0.12, - "output": 0.39 + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-14b", - "name": "Qwen: Qwen3 14B", - "display_name": "Qwen: Qwen3 14B", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text" @@ -65092,10 +68057,10 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 128000, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -65104,134 +68069,114 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.025 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen: Qwen3.5-35B-A3B", - "display_name": "Qwen: Qwen3.5-35B-A3B", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1625, - "output": 1.3 + "input": 0.71, + "output": 0.71 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus-02-15", - "name": "Qwen: Qwen3.5 Plus 2026-02-15", - "display_name": "Qwen: Qwen3.5 Plus 2026-02-15", + "id": "gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.26, - "output": 1.56 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3.6-flash", - "name": "Qwen: Qwen3.6 Flash", - "display_name": "Qwen: Qwen3.6 Flash", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -65240,60 +68185,96 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.25, - "output": 1.5, - "cache_write": 0.3125 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "alfredpros/codellama-7b-instruct-solidity", - "name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", - "display_name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 272000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro-v2", - "name": "Kwaipilot: KAT-Coder-Pro V2", - "display_name": "Kwaipilot: KAT-Coder-Pro V2", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -65303,8 +68284,8 @@ ] }, "limit": { - "context": 256000, - "output": 80000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -65313,127 +68294,100 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-11", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "output": 0.61 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview-05-06", - "name": "Google: Gemini 2.5 Pro Preview 05-06", - "display_name": "Google: Gemini 2.5 Pro Preview 05-06", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { "input": 1.25, "output": 10, - "reasoning": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "cache_read": 0.13 }, "type": "chat" }, { - "id": "google/lyria-3-clip-preview", - "name": "Google: Lyria 3 Clip Preview", - "display_name": "Google: Lyria 3 Clip Preview", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ - "image", "text" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-04-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0, - "output": 0 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview-customtools", - "name": "Google: Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Google: Gemini 3.1 Pro Preview Custom Tools", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -65443,51 +68397,56 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 2, - "output": 12, - "reasoning": 12 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite-preview-09-2025", - "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", - "display_name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -65497,52 +68456,49 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.1, - "output": 0.4, - "reasoning": 0.4, - "cache_read": 0.01, - "cache_write": 0.083333 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-001", - "name": "Google: Gemini 2.0 Flash", - "display_name": "Google: Gemini 2.0 Flash", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 8192, "output": 8192 }, "temperature": true, @@ -65550,362 +68506,258 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2026-03-15", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025, - "cache_write": 0.083333 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "google/lyria-3-pro-preview", - "name": "Google: Lyria 3 Pro Preview", - "display_name": "Google: Lyria 3 Pro Preview", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ - "image", "text" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 4096, + "output": 1024 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-04-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0, - "output": 0 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "google/gemma-3n-e4b-it", - "name": "Google: Gemma 3n 4B", - "display_name": "Google: Gemma 3n 4B", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.02, - "output": 0.04 + "input": 0.37, + "output": 0.37 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite-preview", - "name": "Google: Gemini 3.1 Flash Lite Preview", - "display_name": "Google: Gemini 3.1 Flash Lite Preview", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.25, - "output": 1.5, - "reasoning": 1.5 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Google: Gemini 3.1 Pro Preview", - "display_name": "Google: Gemini 3.1 Pro Preview", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 2, - "output": 12, - "reasoning": 12 + "input": 0.3, + "output": 0.61 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Google: Gemini 3 Flash Preview", - "display_name": "Google: Gemini 3 Flash Preview", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2026-03-15", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.5, - "output": 3, - "reasoning": 3, - "cache_read": 0.05, - "cache_write": 0.083333 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Google: Gemini 2.5 Pro", - "display_name": "Google: Gemini 2.5 Pro", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-03-20", - "last_updated": "2026-03-15", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 1.25, - "output": 10, - "reasoning": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "google/gemini-3-pro-image-preview", - "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", - "display_name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 256000, + "output": 8000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 2, - "output": 12, - "reasoning": 12 + "input": 2.5, + "output": 10 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Google: Gemma 4 31B", - "display_name": "Google: Gemma 4 31B", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 131072, "output": 131072 }, "temperature": true, @@ -65914,56 +68766,55 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-11", + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.14, - "output": 0.4 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-image", - "name": "Google: Nano Banana (Gemini 2.5 Flash Image)", - "display_name": "Google: Nano Banana (Gemini 2.5 Flash Image)", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-08", - "last_updated": "2026-03-15", + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 0.3, - "output": 2.5 + "input": 3, + "output": 4 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Google: Gemma 3 12B", - "display_name": "Google: Gemma 3 12B", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -65971,46 +68822,42 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 512, + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-03-13", - "last_updated": "2026-03-15", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.04, - "output": 0.13, - "cache_read": 0.015 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Google: Gemini 2.5 Flash", - "display_name": "Google: Gemini 2.5 Flash", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -66020,115 +68867,101 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-17", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.3, - "output": 2.5, - "reasoning": 2.5, - "cache_read": 0.03, - "cache_write": 0.083333 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-image-preview", - "name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", - "display_name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 0.5, - "output": 3 + "input": 1.5, + "output": 6, + "cache_read": 0.375 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemma-3-4b-it", - "name": "Google: Gemma 3 4B", - "display_name": "Google: Gemma 3 4B", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 19200 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-03-13", - "last_updated": "2026-03-15", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.04, - "output": 0.08 + "input": 2.04, + "output": 2.04 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview", - "name": "Google: Gemini 2.5 Pro Preview 06-05", - "display_name": "Google: Gemini 2.5 Pro Preview 06-05", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "audio", - "image", - "pdf", "text" ], "output": [ @@ -66136,8 +68969,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -66148,39 +68981,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", "cost": { - "input": 1.25, - "output": 10, - "reasoning": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "google/gemma-2-27b-it", - "name": "Google: Gemma 2 27B", - "display_name": "Google: Gemma 2 27B", + "id": "mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ "text" @@ -66190,168 +69014,221 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-06-24", - "last_updated": "2024-06-24", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.65, - "output": 0.65 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Google: Gemma 3 27B", - "display_name": "Google: Gemma 3 27B", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.03, - "output": 0.11, - "cache_read": 0.02 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Google: Gemma 4 26B A4B", - "display_name": "Google: Gemma 4 26B A4B", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "image", "text", - "video" + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-03", - "last_updated": "2026-04-11", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.12, - "output": 0.4 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Google: Gemini 2.5 Flash Lite", - "display_name": "Google: Gemini 2.5 Flash Lite", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-17", - "last_updated": "2026-03-15", + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 0.1, - "output": 0.4, - "reasoning": 0.4, - "cache_read": 0.01, - "cache_write": 0.083333 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite-001", - "name": "Google: Gemini 2.0 Flash Lite", - "display_name": "Google: Gemini 2.0 Flash Lite", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "cost": { + "input": 2.68, + "output": 3.54 + }, + "type": "chat" + }, + { + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -66360,62 +69237,52 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2026-03-15", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.075, + "input": 0.1, "output": 0.3 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "MoonshotAI: Kimi K2.5", - "display_name": "MoonshotAI: Kimi K2.5", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-15", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.45, - "output": 2.2 + "input": 0.2, + "output": 0.78 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "MoonshotAI: Kimi K2 0905", - "display_name": "MoonshotAI: Kimi K2 0905", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -66425,74 +69292,59 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 8191, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.15 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "moonshotai/kimi-k2.6", - "name": "MoonshotAI: Kimi K2.6", - "display_name": "MoonshotAI: Kimi K2.6", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2", - "name": "MoonshotAI: Kimi K2 0711", - "display_name": "MoonshotAI: Kimi K2 0711", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ "text" @@ -66502,28 +69354,29 @@ ] }, "limit": { - "context": 131000, - "output": 26215 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2026-03-15", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.55, - "output": 2.2 + "input": 0.16, + "output": 0.64 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "MoonshotAI: Kimi K2 Thinking", - "display_name": "MoonshotAI: Kimi K2 Thinking", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -66533,73 +69386,60 @@ ] }, "limit": { - "context": 131072, - "output": 65535 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2026-03-15", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.47, - "output": 2, - "cache_read": 0.2 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0", - "name": "AionLabs: Aion-1.0", - "display_name": "AionLabs: Aion-1.0", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", + "release_date": "2025-05-19", + "last_updated": "2025-11-18", "cost": { - "input": 4, - "output": 8 + "input": 0.14, + "output": 0 }, "type": "chat" }, { - "id": "aion-labs/aion-rp-llama-3.1-8b", - "name": "AionLabs: Aion-RP 1.0 (8B)", - "display_name": "AionLabs: Aion-RP 1.0 (8B)", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -66609,8 +69449,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -66618,19 +69458,58 @@ "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.15, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.8, - "output": 1.6 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "aion-labs/aion-2.0", - "name": "AionLabs: Aion-2.0", - "display_name": "AionLabs: Aion-2.0", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ "text" @@ -66640,8 +69519,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -66650,51 +69529,76 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.8, - "output": 1.6 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0-mini", - "name": "AionLabs: Aion-1.0-Mini", - "display_name": "AionLabs: Aion-1.0-Mini", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.7, - "output": 1.4 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "thedrummer/unslopnemo-12b", - "name": "TheDrummer: UnslopNemo 12B", - "display_name": "TheDrummer: UnslopNemo 12B", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -66704,28 +69608,29 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-09", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", "cost": { - "input": 0.4, - "output": 0.4 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "thedrummer/cydonia-24b-v4.1", - "name": "TheDrummer: Cydonia 24B V4.1", - "display_name": "TheDrummer: Cydonia 24B V4.1", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ "text" @@ -66735,8 +69640,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -66745,18 +69650,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-09-27", - "last_updated": "2026-03-15", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.3, - "output": 0.5 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "thedrummer/skyfall-36b-v2", - "name": "TheDrummer: Skyfall 36B V2", - "display_name": "TheDrummer: Skyfall 36B V2", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -66766,28 +69672,29 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-03-11", - "last_updated": "2026-03-15", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.55, - "output": 0.8 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "thedrummer/rocinante-12b", - "name": "TheDrummer: Rocinante 12B", - "display_name": "TheDrummer: Rocinante 12B", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -66797,32 +69704,31 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-09-30", - "last_updated": "2026-03-15", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.17, - "output": 0.43 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -66830,35 +69736,31 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "anthropic/claude-3.7-sonnet:thinking", - "name": "Anthropic: Claude 3.7 Sonnet (thinking)", - "display_name": "Anthropic: Claude 3.7 Sonnet (thinking)", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -66866,8 +69768,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -66877,43 +69779,26 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6-fast", - "name": "Anthropic: Claude Opus 4.6 (Fast)", - "display_name": "Anthropic: Claude Opus 4.6 (Fast)", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -66921,62 +69806,31 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-04-07", - "last_updated": "2026-04-11", + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 30, - "output": 150, - "cache_read": 3, - "cache_write": 37.5 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -66984,177 +69838,95 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Anthropic: Claude Opus 4.6", - "display_name": "Anthropic: Claude Opus 4.6", + "id": "deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "display_name": "DeepSeek-V3.2-Speciale", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 128000, "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Anthropic: Claude Opus 4.7", - "display_name": "Anthropic: Claude Opus 4.7", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 512, + "output": 1024 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -67162,35 +69934,31 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.14, + "output": 4.56 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -67198,8 +69966,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -67207,96 +69975,120 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-11-24", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - "name": "Anthropic: Claude 3 Haiku", - "display_name": "Anthropic: Claude 3 Haiku", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-03-07", - "last_updated": "2024-03-07", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "anthropic/claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -67304,31 +70096,45 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 16.5, + "output": 66, + "cache_read": 8.25 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ "text", @@ -67339,7 +70145,7 @@ ] }, "limit": { - "context": 200000, + "context": 128000, "output": 8192 }, "temperature": true, @@ -67348,24 +70154,22 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Anthropic: Claude Haiku 4.5", - "display_name": "Anthropic: Claude Haiku 4.5", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -67373,91 +70177,41 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" - }, - { - "id": "anthropic/claude-sonnet-4.6", - "name": "Anthropic: Claude Sonnet 4.6", - "display_name": "Anthropic: Claude Sonnet 4.6", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 3, - "output": 15 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "switchpoint/router", - "name": "Switchpoint Router", - "display_name": "Switchpoint Router", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -67467,32 +70221,31 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-12", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.85, - "output": 3.4 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "bytedance/ui-tars-1.5-7b", - "name": "ByteDance: UI-TARS 7B ", - "display_name": "ByteDance: UI-TARS 7B ", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -67500,202 +70253,186 @@ ] }, "limit": { - "context": 128000, - "output": 2048 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2026-03-15", + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.1, - "output": 0.2 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "tngtech/deepseek-r1t2-chimera", - "name": "TNG: DeepSeek R1T2 Chimera", - "display_name": "TNG: DeepSeek R1T2 Chimera", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.25, - "output": 0.85, + "input": 1.75, + "output": 14, "cache_read": 0.125 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5-pro", - "name": "Xiaomi: MiMo V2.5 Pro", - "display_name": "Xiaomi: MiMo V2.5 Pro", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-omni", - "name": "Xiaomi: MiMo-V2-Omni", - "display_name": "Xiaomi: MiMo-V2-Omni", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 5.33, + "output": 16 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5", - "name": "Xiaomi: MiMo-V2.5", - "display_name": "Xiaomi: MiMo-V2.5", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ "text", "image", - "audio", - "video" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 0.08, + "output": 0.32, + "input_audio": 4 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-pro", - "name": "Xiaomi: MiMo-V2-Pro", - "display_name": "Xiaomi: MiMo-V2-Pro", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ "text" @@ -67705,36 +70442,29 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "Xiaomi: MiMo-V2-Flash", - "display_name": "Xiaomi: MiMo-V2-Flash", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ "text" @@ -67744,152 +70474,142 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.09, - "output": 0.29, - "cache_read": 0.045 + "input": 0.125, + "output": 0.5 }, "type": "chat" - } - ] - }, - "sap-ai-core": { - "id": "sap-ai-core", - "name": "SAP AI Core", - "display_name": "SAP AI Core", - "doc": "https://help.sap.com/docs/sap-ai-core", - "models": [ + }, { - "id": "anthropic--claude-4.6-opus", - "name": "anthropic--claude-4.6-opus", - "display_name": "anthropic--claude-4.6-opus", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "anthropic--claude-3-haiku", - "name": "anthropic--claude-3-haiku", - "display_name": "anthropic--claude-3-haiku", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.13, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "anthropic--claude-3-opus", - "name": "anthropic--claude-3-opus", - "display_name": "anthropic--claude-3-opus", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -67903,19 +70623,20 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -67928,50 +70649,52 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "gpt-5-nano", - "display_name": "gpt-5-nano", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -67984,26 +70707,40 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -68011,107 +70748,121 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-06-05", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "anthropic--claude-3.7-sonnet", - "name": "anthropic--claude-3.7-sonnet", - "display_name": "anthropic--claude-3.7-sonnet", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 30, + "output": 180, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "sonar-pro", - "name": "sonar-pro", - "display_name": "sonar-pro", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -68123,33 +70874,47 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 3, - "output": 15 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "anthropic--claude-4.5-sonnet", - "name": "anthropic--claude-4.5-sonnet", - "display_name": "anthropic--claude-4.5-sonnet", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -68157,108 +70922,131 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "anthropic--claude-4.6-sonnet", - "name": "anthropic--claude-4.6-sonnet", - "display_name": "anthropic--claude-4.6-sonnet", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "sonar-deep-research", - "display_name": "sonar-deep-research", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-02-01", - "last_updated": "2025-09-01", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2, - "output": 8, - "reasoning": 3 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -68266,10 +71054,10 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -68279,79 +71067,91 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-06-05", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "anthropic--claude-4.5-opus", - "name": "anthropic--claude-4.5-opus", - "display_name": "anthropic--claude-4.5-opus", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "sonar", - "name": "sonar", - "display_name": "sonar", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -68362,75 +71162,71 @@ "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1, - "output": 1 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "anthropic--claude-4-opus", - "name": "anthropic--claude-4-opus", - "display_name": "anthropic--claude-4-opus", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "anthropic--claude-3-sonnet", - "name": "anthropic--claude-3-sonnet", - "display_name": "anthropic--claude-3-sonnet", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -68439,152 +71235,135 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "anthropic--claude-4-sonnet", - "name": "anthropic--claude-4-sonnet", - "display_name": "anthropic--claude-4-sonnet", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "gemini-2.5-flash-lite", - "display_name": "gemini-2.5-flash-lite", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "anthropic--claude-4.5-haiku", - "name": "anthropic--claude-4.5-haiku", - "display_name": "anthropic--claude-4.5-haiku", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", @@ -68595,86 +71374,70 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 1.25, + "input": 2.5, "output": 10, - "cache_read": 0.125 + "cache_read": 1.25 }, "type": "chat" - }, + } + ] + }, + "ovhcloud": { + "id": "ovhcloud", + "name": "OVHcloud AI Endpoints", + "display_name": "OVHcloud AI Endpoints", + "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", + "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", + "models": [ { - "id": "gpt-4.1", - "name": "gpt-4.1", - "display_name": "gpt-4.1", + "id": "mistral-7b-instruct-v0.3", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.11, + "output": 0.11 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "gpt-4.1-mini", - "display_name": "gpt-4.1-mini", + "id": "qwen2.5-vl-72b-instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", @@ -68685,43 +71448,40 @@ ] }, "limit": { - "context": 1047576, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2025-03-31", + "last_updated": "2025-03-31", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 1.01, + "output": 1.01 }, "type": "chat" }, { - "id": "anthropic--claude-3.5-sonnet", - "name": "anthropic--claude-3.5-sonnet", - "display_name": "anthropic--claude-3.5-sonnet", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral-Small-3.2-24B-Instruct-2506", + "display_name": "Mistral-Small-3.2-24B-Instruct-2506", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -68729,31 +71489,19 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.1, + "output": 0.31 }, "type": "chat" - } - ] - }, - "morph": { - "id": "morph", - "name": "Morph", - "display_name": "Morph", - "api": "https://api.morphllm.com/v1", - "doc": "https://docs.morphllm.com/api-reference/introduction", - "models": [ + }, { - "id": "auto", - "name": "Auto", - "display_name": "Auto", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral-Nemo-Instruct-2407", + "display_name": "Mistral-Nemo-Instruct-2407", "modalities": { "input": [ "text" @@ -68763,59 +71511,71 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 65536, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.85, - "output": 1.55 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "qwen3.5-9b", + "name": "Qwen3.5-9B", + "display_name": "Qwen3.5-9B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.1, + "output": 0.15 }, "type": "chat" }, { - "id": "morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -68825,51 +71585,9 @@ ] }, "limit": { - "context": 32000, - "output": 32000 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", - "cost": { - "input": 0.9, - "output": 1.9 - }, - "type": "chat" - } - ] - }, - "cloudflare-ai-gateway": { - "id": "cloudflare-ai-gateway", - "name": "Cloudflare AI Gateway", - "display_name": "Cloudflare AI Gateway", - "doc": "https://developers.cloudflare.com/ai-gateway/", - "models": [ - { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -68877,277 +71595,217 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.05, + "output": 0.18 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "meta-llama-3_3-70b-instruct", + "name": "Meta-Llama-3_3-70B-Instruct", + "display_name": "Meta-Llama-3_3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 10, - "output": 30 + "input": 0.74, + "output": 0.74 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.09, + "output": 0.25 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 20, - "output": 80 + "input": 0.07, + "output": 0.26 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.09, + "output": 0.47 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "llama-3.1-8b-instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-11", + "last_updated": "2025-06-11", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.11, + "output": 0.11 }, "type": "chat" - }, + } + ] + }, + "friendli": { + "id": "friendli", + "name": "Friendli", + "display_name": "Friendli", + "api": "https://api.friendli.ai/serverless/v1", + "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", + "models": [ { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 202752 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -69156,145 +71814,104 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1, + "output": 3.2, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 202752 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2025-12-23", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -69304,30 +71921,28 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2025-12-23", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 + "input": 0.6, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -69337,10 +71952,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 196608, + "output": 196608 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -69349,33 +71964,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -69385,170 +71996,150 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2026-01-29", "cost": { - "input": 30, - "output": 60 + "input": 0.2, + "output": 0.8 }, "type": "chat" - }, + } + ] + }, + "regolo-ai": { + "id": "regolo-ai", + "name": "Regolo AI", + "display_name": "Regolo AI", + "api": "https://api.regolo.ai/v1", + "doc": "https://docs.regolo.ai/", + "models": [ { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "qwen3.5-122b", + "name": "Qwen3.5-122B", + "display_name": "Qwen3.5-122B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.9, + "output": 3.6 }, "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "mistral-small3.2", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 120000, + "output": 120000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.5, + "output": 2.2 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "minimax-m2.5", + "name": "MiniMax 2.5", + "display_name": "MiniMax 2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 190000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2026-03-10", + "last_updated": "2026-03-10", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.8, + "output": 3.5 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "qwen3.5-9b", + "name": "Qwen3.5-9B", + "display_name": "Qwen3.5-9B", "modalities": { "input": [ "text", @@ -69559,65 +72150,51 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "gpt-oss-20b", + "name": "GPT-OSS-20B", + "display_name": "GPT-OSS-20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -69630,166 +72207,95 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.4, + "output": 1.8 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "qwen3-coder-next", + "name": "Qwen3-Coder-Next", + "display_name": "Qwen3-Coder-Next", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "qwen3-embedding-8b", + "name": "Qwen3-Embedding-8B", + "display_name": "Qwen3-Embedding-8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 32768, + "output": 8192 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0.1 }, - "type": "chat" + "type": "embedding" }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "mistral-small-4-119b", + "name": "Mistral Small 4 119B", + "display_name": "Mistral Small 4 119B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -69797,113 +72303,93 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.75, + "output": 3 }, "type": "chat" }, { - "id": "anthropic/claude-3-5-haiku", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "qwen3-reranker-4b", + "name": "Qwen3-Reranker-4B", + "display_name": "Qwen3-Reranker-4B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 32768, "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.12, + "output": 0.12 }, - "type": "chat" + "type": "rerank" }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 2.7 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -69911,78 +72397,151 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1, + "output": 4.2 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "qwen-image", + "name": "Qwen-Image", + "display_name": "Qwen-Image", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", + "cost": { + "input": 0.5, + "output": 2 + }, + "type": "imageGeneration" + }, + { + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 120000, + "output": 120000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-07", + "last_updated": "2025-04-07", + "cost": { + "input": 0.05, + "output": 0.25 + }, + "type": "chat" + } + ] + }, + "claudinio": { + "id": "claudinio", + "name": "Claudinio", + "display_name": "Claudinio", + "api": "https://api.claudin.io/v1", + "doc": "https://claudin.io", + "models": [ + { + "id": "claudinio", + "name": "Claudinio", + "display_name": "Claudinio", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 256000, "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2026-05", + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.5, + "output": 2, + "cache_read": 0.05 }, "type": "chat" - }, + } + ] + }, + "orcarouter": { + "id": "orcarouter", + "name": "OrcaRouter", + "display_name": "OrcaRouter", + "api": "https://api.orcarouter.ai/v1", + "doc": "https://docs.orcarouter.ai", + "models": [ { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "orcarouter/auto", + "name": "OrcaRouter Auto", + "display_name": "OrcaRouter Auto", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -69991,34 +72550,30 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "release_date": "2025-01-01", + "last_updated": "2026-05-14", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "grok/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -70026,141 +72581,133 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6 (latest)", - "display_name": "Claude Opus 4.6 (latest)", + "id": "z-ai/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "z-ai/glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "z-ai/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -70173,110 +72720,117 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic/claude-3-sonnet", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "z-ai/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic/claude-3-opus", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "z-ai/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "z-ai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -70285,54 +72839,65 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" - } - ] - }, - "github-copilot": { - "id": "github-copilot", - "name": "GitHub Copilot", - "display_name": "GitHub Copilot", - "api": "https://api.githubcopilot.com", - "doc": "https://docs.github.com/en/copilot", - "models": [ + }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-max", - "display_name": "GPT-5.1-Codex-max", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -70362,7 +72927,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -70375,19 +72941,53 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16385, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", @@ -70398,10 +72998,10 @@ ] }, "limit": { - "context": 144000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -70411,43 +73011,40 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high" + "high", + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "openai/gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ "text", @@ -70458,63 +73055,45 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "openai/gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -70522,38 +73101,38 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0, - "output": 0 + "input": 30, + "output": 180, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ "text", @@ -70571,19 +73150,19 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -70594,21 +73173,22 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5-mini", - "display_name": "GPT-5-mini", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ "text", @@ -70619,10 +73199,10 @@ ] }, "limit": { - "context": 264000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -70633,12 +73213,11 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ - "minimal", - "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -70651,25 +73230,23 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "openai/gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" @@ -70677,46 +73254,28 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3-Codex", - "display_name": "GPT-5.3-Codex", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", @@ -70743,10 +73302,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -70759,25 +73318,24 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "openai/gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" @@ -70785,48 +73343,65 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "openai/gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", @@ -70837,28 +73412,21 @@ ] }, "limit": { - "context": 264000, - "output": 64000 + "context": 400000, + "output": 272000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], + "default_enabled": true, + "mode": "fixed", + "effort": "high", "verbosity": "medium", "verbosity_options": [ "low", @@ -70870,19 +73438,54 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -70912,8 +73515,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -70926,19 +73528,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -70949,80 +73552,80 @@ ] }, "limit": { - "context": 144000, - "output": 64000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ + "minimal", "low", "medium", - "high", - "xhigh" + "high" ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high", @@ -71037,21 +73640,106 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 22.5, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-mini", - "display_name": "GPT-5.1-Codex-mini", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 10, + "output": 30 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -71081,7 +73769,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -71092,21 +73781,22 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0, - "output": 0 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", @@ -71117,43 +73807,67 @@ ] }, "limit": { - "context": 216000, - "output": 16000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -71161,24 +73875,57 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-27", - "last_updated": "2025-08-27", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", @@ -71189,26 +73936,25 @@ ] }, "limit": { - "context": 264000, - "output": 64000 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", - "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -71221,19 +73967,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0, - "output": 0 + "input": 60, + "output": 270, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "openai/gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", @@ -71244,10 +74004,10 @@ ] }, "limit": { - "context": 144000, - "output": 32000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -71255,19 +74015,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-opus-41", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", @@ -71278,64 +74039,62 @@ ] }, "limit": { - "context": 80000, - "output": 16000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "openai/gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 32000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0, - "output": 0 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", @@ -71365,8 +74124,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -71377,21 +74135,22 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "openai/gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ "text", @@ -71403,7 +74162,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -71413,32 +74172,34 @@ "attachment": true, "open_weights": false, "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -71451,10 +74212,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -71467,19 +74228,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -71490,63 +74252,109 @@ ] }, "limit": { - "context": 144000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "openai/gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ "text", @@ -71557,56 +74365,30 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -71624,16 +74406,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -71647,76 +74429,61 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" - } - ] - }, - "mixlayer": { - "id": "mixlayer", - "name": "Mixlayer", - "display_name": "Mixlayer", - "api": "https://models.mixlayer.ai/v1", - "doc": "https://docs.mixlayer.com", - "models": [ + }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5 122B A10B", - "display_name": "Qwen3.5 122B A10B", + "id": "openai/gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.4, - "output": 3.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3.5-27b", - "name": "Qwen3.5 27B", - "display_name": "Qwen3.5 27B", + "id": "kimi/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -71726,7 +74493,7 @@ "context": 262144, "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -71745,21 +74512,25 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.3, - "output": 2.4 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "kimi/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -71786,20 +74557,22 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen/qwen3.5-9b", - "name": "Qwen3.5 9B", - "display_name": "Qwen3.5 9B", + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -71809,8 +74582,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -71834,15 +74607,17 @@ "release_date": "2026-03-18", "last_updated": "2026-03-18", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen3.5 35B A3B", - "display_name": "Qwen3.5 35B A3B", + "id": "minimax/minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -71852,8 +74627,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -71863,68 +74638,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", - "cost": { - "input": 0.25, - "output": 1.3 - }, - "type": "chat" - } - ] - }, - "xiaomi-token-plan-sgp": { - "id": "xiaomi-token-plan-sgp", - "name": "Xiaomi Token Plan (Singapore)", - "display_name": "Xiaomi Token Plan (Singapore)", - "api": "https://token-plan-sgp.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ - { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 16384 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "minimax/minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -71934,8 +74666,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -71956,20 +74688,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" @@ -71979,7 +74711,7 @@ ] }, "limit": { - "context": 1048576, + "context": 204800, "output": 131072 }, "temperature": true, @@ -71990,95 +74722,92 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -72086,8 +74815,8 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -72095,97 +74824,90 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" - } - ] - }, - "zai": { - "id": "zai", - "name": "Z.AI", - "display_name": "Z.AI", - "api": "https://api.z.ai/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ + }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ "text", "image", - "video", "pdf" ], "output": [ @@ -72194,7 +74916,7 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -72202,44 +74924,36 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24, - "cache_write": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -72247,45 +74961,36 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -72293,36 +74998,28 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -72330,7 +75027,7 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -72338,26 +75035,28 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -72365,7 +75064,7 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -72373,79 +75072,97 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "qwen/qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72453,34 +75170,47 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.115, + "output": 0.688, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72499,68 +75229,77 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "attachment": true, + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24, - "cache_write": 0 + "input": 0.115, + "output": 0.917 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "qwen/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, - "open_weights": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0.359, + "output": 1.434 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72570,26 +75309,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.172, + "output": 1.032 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "qwen/qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", @@ -72601,8 +75343,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72610,32 +75352,66 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5 35B-A3B", + "display_name": "Qwen3.5 35B-A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72643,34 +75419,45 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.057, + "output": 0.459 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "qwen/qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72680,46 +75467,43 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.248, + "output": 1.485 }, "type": "chat" - } - ] - }, - "opencode": { - "id": "opencode", - "name": "OpenCode Zen", - "display_name": "OpenCode Zen", - "api": "https://opencode.ai/zen/v1", - "doc": "https://opencode.ai/docs/zen", - "models": [ + }, { - "id": "minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72738,91 +75522,71 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.086, + "output": 0.688 }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "google/gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.5, + "output": 3, + "cache_read": 0.075, + "input_audio": 1 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B", + "display_name": "Gemma 4 26B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -72830,40 +75594,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.06, + "output": 0.33 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -72875,41 +75633,66 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.08 + "input": 2.5, + "output": 15, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -72917,89 +75700,93 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.1 + "input": 0.13, + "output": 0.38 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "glm-4.7-free", - "name": "GLM-4.7 Free", - "display_name": "GLM-4.7 Free", + "id": "google/gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -73007,33 +75794,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gemini-3.1-pro", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", @@ -73047,8 +75823,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -73076,28 +75852,41 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 2, - "output": 12, + "input": 4, + "output": 18, "cache_read": 0.2, "context_over_200k": { "input": 4, "output": 18, "cache_read": 0.4 - } + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -73105,71 +75894,79 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 4, + "output": 18, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "kimi-k2.5-free", - "name": "Kimi K2.5 Free", - "display_name": "Kimi K2.5 Free", + "id": "google/gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -73179,35 +75976,32 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -73215,70 +76009,81 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" ], - "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 4, + "output": 18, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -73288,43 +76093,44 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ "minimal", "low", "medium", "high" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -73332,10 +76138,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -73345,39 +76151,39 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "minimax-m2.5-free", - "name": "MiniMax M2.5 Free", - "display_name": "MiniMax M2.5 Free", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ "text" @@ -73387,36 +76193,30 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "ring-2.6-1t-free", - "name": "Ring 2.6 1T Free", - "display_name": "Ring 2.6 1T Free", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -73426,8 +76226,8 @@ ] }, "limit": { - "context": 262000, - "output": 66000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -73448,76 +76248,65 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-05-08", - "last_updated": "2026-05-08", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 0.56, + "output": 1.12, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "deepseek/deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.435, + "output": 0.87, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "deepseek-v4-flash-free", - "name": "DeepSeek V4 Flash Free", - "display_name": "DeepSeek V4 Flash Free", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -73553,27 +76342,38 @@ "release_date": "2026-04-24", "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.19, + "output": 0.37, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "opencode-go": { + "id": "opencode-go", + "name": "OpenCode Go", + "display_name": "OpenCode Go", + "api": "https://opencode.ai/zen/go/v1", + "doc": "https://opencode.ai/docs/zen", + "models": [ { - "id": "big-pickle", - "name": "Big Pickle", - "display_name": "Big Pickle", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -73592,36 +76392,35 @@ ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-10-17", - "last_updated": "2025-10-17", + "attachment": true, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -73631,39 +76430,43 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.2, + "output": 1.2, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 202752, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -73682,27 +76485,27 @@ ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "mimo-v2-omni", + "name": "MiMo V2 Omni", + "display_name": "MiMo V2 Omni", "modalities": { "input": [ "text", "image", + "audio", "pdf" ], "output": [ @@ -73710,89 +76513,42 @@ ] }, "limit": { - "context": 400000, + "context": 262144, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", - "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 - }, - "type": "chat" - }, - { - "id": "claude-3-5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -73802,8 +76558,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -73824,20 +76580,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.1 + "input": 1.74, + "output": 3.48, + "cache_read": 0.0145 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ "text" @@ -73847,8 +76603,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -73867,95 +76623,90 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -73964,146 +76715,81 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "mimo-v2-pro", + "name": "MiMo V2 Pro", + "display_name": "MiMo V2 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 1000000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } - }, - "type": "chat" - }, - { - "id": "gemini-3-flash", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", - "modalities": { - "input": [ - "text", - "image", - "video", - "audio", - "pdf" ], "output": [ "text" @@ -74111,7 +76797,7 @@ }, "limit": { "context": 1048576, - "output": 65536 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -74122,141 +76808,123 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.5, + "input": 1, "output": 3, - "cache_read": 0.05 - }, - "type": "chat" - }, - { - "id": "trinity-large-preview-free", - "name": "Trinity Large Preview", - "display_name": "Trinity Large Preview", - "modalities": { - "input": [ - "text" + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-01-28", - "last_updated": "2026-01-28", - "cost": { - "input": 0, - "output": 0 + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "mimo-v2.5", + "name": "MiMo V2.5", + "display_name": "MiMo V2.5", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + } }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -74265,39 +76933,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 30, - "output": 180, - "cache_read": 30 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "glm-5-free", - "name": "GLM-5 Free", - "display_name": "GLM-5 Free", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -74307,8 +76966,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 202752, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -74333,29 +76992,29 @@ "release_date": "2026-02-11", "last_updated": "2026-02-11", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -74365,26 +77024,40 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" - }, + } + ] + }, + "llmgateway": { + "id": "llmgateway", + "name": "LLM Gateway", + "display_name": "LLM Gateway", + "api": "https://api.llmgateway.io/v1", + "doc": "https://llmgateway.io/docs", + "models": [ { - "id": "minimax-m2.1-free", - "name": "MiniMax M2.1 Free", - "display_name": "MiniMax M2.1 Free", + "id": "gemma-2-27b-it-together", + "name": "Gemma 2 27B IT", + "display_name": "Gemma 2 27B IT", "modalities": { "input": [ "text" @@ -74394,36 +77067,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.08, + "output": 0.08 }, "type": "chat" }, { - "id": "qwen3.6-plus-free", - "name": "Qwen3.6 Plus Free", - "display_name": "Qwen3.6 Plus Free", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct (2507)", + "display_name": "Qwen3 30B A3B Instruct (2507)", "modalities": { "input": [ "text" @@ -74433,42 +77098,28 @@ ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "open_weights": true, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "claude-3-7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", "modalities": { "input": [ "text" @@ -74478,83 +77129,94 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.1 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "ling-2.6-flash-free", - "name": "Ling 2.6 Flash Free", - "display_name": "Ling 2.6 Flash Free", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262100, - "output": 32800 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "gemini-3-pro", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "seed-1-6-250615", + "name": "Seed 1.6 (250615)", + "display_name": "Seed 1.6 (250615)", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -74562,57 +77224,65 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": true, + "open_weights": true, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "gpt-4o-mini-search-preview", + "name": "GPT-4o Mini Search Preview", + "display_name": "GPT-4o Mini Search Preview", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "seed-1-6-flash-250715", + "name": "Seed 1.6 Flash (250715)", + "display_name": "Seed 1.6 Flash (250715)", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -74620,33 +77290,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.07, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "qwen2-5-vl-32b-instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ "text", @@ -74657,86 +77315,60 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "release_date": "2025-03-15", + "last_updated": "2025-03-15", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "grok-code", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "gemma-3-27b", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-20", - "last_updated": "2025-08-20", + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "mimo-v2-flash-free", - "name": "MiMo V2 Flash Free", - "display_name": "MiMo V2 Flash Free", + "id": "llama-3.1-70b-instruct", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ "text" @@ -74746,8 +77378,40 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 2048 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.72, + "output": 0.72 + }, + "type": "chat" + }, + { + "id": "qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -74766,35 +77430,34 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "gpt-5.3-codex-spark", - "name": "GPT-5.3 Codex Spark", - "display_name": "GPT-5.3 Codex Spark", + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -74802,44 +77465,28 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "hy3-preview-free", - "name": "Hy3 preview Free", - "display_name": "Hy3 preview Free", + "id": "seed-1-6-250915", + "name": "Seed 1.6 (250915)", + "display_name": "Seed 1.6 (250915)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -74847,7 +77494,7 @@ }, "limit": { "context": 256000, - "output": 64000 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -74855,22 +77502,21 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 (0528)", + "display_name": "DeepSeek R1 (0528)", "modalities": { "input": [ "text" @@ -74880,11 +77526,11 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 64000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -74902,20 +77548,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "codestral-2508", + "name": "Codestral", + "display_name": "Codestral", "modalities": { "input": [ "text" @@ -74925,35 +77569,32 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen3-vl-flash", + "name": "Qwen3 VL Flash", + "display_name": "Qwen3 VL Flash", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -74961,75 +77602,72 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "glm-4.6v-flash", + "name": "GLM-4.6V Flash", + "display_name": "GLM-4.6V Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.45, - "output": 1.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", @@ -75040,10 +77678,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -75051,53 +77689,35 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.28, + "output": 0.42, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "gemini-pro-latest", + "name": "Gemini Pro Latest", + "display_name": "Gemini Pro Latest", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -75106,34 +77726,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2026-02-27", + "last_updated": "2026-02-27", "cost": { - "input": 0.2, - "output": 1.2, - "cache_read": 0.02, - "cache_write": 0.25 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "mimo-v2-pro-free", - "name": "MiMo V2 Pro Free", - "display_name": "MiMo V2 Pro Free", + "id": "qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B FP8", + "display_name": "Qwen3 30B A3B FP8", "modalities": { "input": [ "text" @@ -75143,8 +77750,8 @@ ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -75152,33 +77759,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "nemotron-3-super-free", - "name": "Nemotron 3 Super Free", - "display_name": "Nemotron 3 Super Free", + "id": "qwen-coder-plus", + "name": "Qwen Coder Plus", + "display_name": "Qwen Coder Plus", "modalities": { "input": [ "text" @@ -75188,78 +77782,60 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.5, + "output": 1 }, "type": "chat" }, { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "minimax-m2.1-lightning", + "name": "MiniMax M2.1 Lightning", + "display_name": "MiniMax M2.1 Lightning", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 196608, + "output": 131072 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 30, - "output": 180, - "cache_read": 30 + "input": 0.12, + "output": 0.48 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "llama-3.1-nemotron-ultra-253b", + "name": "Llama 3.1 Nemotron Ultra 253B", + "display_name": "Llama 3.1 Nemotron Ultra 253B", "modalities": { "input": [ "text" @@ -75269,42 +77845,28 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2025-04-07", + "last_updated": "2025-04-07", "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ "text", @@ -75315,297 +77877,186 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 1.6, + "output": 6.4 }, "type": "chat" }, { - "id": "mimo-v2-omni-free", - "name": "MiMo V2 Omni Free", - "display_name": "MiMo V2 Omni Free", + "id": "glm-4.5-airx", + "name": "GLM-4.5 AirX", + "display_name": "GLM-4.5 AirX", "modalities": { "input": [ - "text", - "image", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 1.1, + "output": 4.5, + "cache_read": 0.22 }, - "attachment": true, + "type": "chat" + }, + { + "id": "llama-3.2-11b-instruct", + "name": "Llama 3.2 11B Instruct", + "display_name": "Llama 3.2 11B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.07, + "output": 0.33 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "grok-4-0709", + "name": "Grok 4 (0709)", + "display_name": "Grok 4 (0709)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "ministral-14b-2512", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "gpt-4o-search-preview", + "name": "GPT-4o Search Preview", + "display_name": "GPT-4o Search Preview", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 2.5, + "output": 10 }, "type": "chat" - } - ] - }, - "stepfun": { - "id": "stepfun", - "name": "StepFun", - "display_name": "StepFun", - "api": "https://api.stepfun.com/v1", - "doc": "https://platform.stepfun.com/docs/zh/overview/concept", - "models": [ + }, { - "id": "step-3.5-flash-2603", - "name": "Step 3.5 Flash 2603", - "display_name": "Step 3.5 Flash 2603", + "id": "gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -75615,8 +78066,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 32766 }, "temperature": true, "tool_call": true, @@ -75624,22 +78075,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "output": 0.5 }, "type": "chat" }, { - "id": "step-1-32k", - "name": "Step 1 (32K)", - "display_name": "Step 1 (32K)", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -75649,8 +78103,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -75660,20 +78114,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-01", - "last_updated": "2026-02-13", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 2.05, - "output": 9.59, - "cache_read": 0.41 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking (2507)", + "display_name": "Qwen3 30B A3B Thinking (2507)", "modalities": { "input": [ "text" @@ -75683,8 +78135,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -75692,22 +78144,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-02-13", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.096, - "output": 0.288, - "cache_read": 0.019 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "step-2-16k", - "name": "Step 2 (16K)", - "display_name": "Step 2 (16K)", + "id": "llama-4-scout", + "name": "Llama 4 Scout", + "display_name": "Llama 4 Scout", "modalities": { "input": [ "text" @@ -75717,40 +78178,60 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-01", - "last_updated": "2026-02-13", + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 5.21, - "output": 16.44, - "cache_read": 1.04 + "input": 0.18, + "output": 0.59 }, "type": "chat" - } - ] - }, - "nebius": { - "id": "nebius", - "name": "Nebius Token Factory", - "display_name": "Nebius Token Factory", - "api": "https://api.tokenfactory.nebius.com/v1", - "doc": "https://docs.tokenfactory.nebius.com/", - "models": [ + }, { - "id": "NousResearch/Hermes-4-70B", - "name": "Hermes-4-70B", - "display_name": "Hermes-4-70B", + "id": "ministral-3b-2512", + "name": "Ministral 3B", + "display_name": "Ministral 3B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "chat" + }, + { + "id": "qwen3-4b-fp8", + "name": "Qwen3 4B FP8", + "display_name": "Qwen3 4B FP8", "modalities": { "input": [ "text" @@ -75760,7 +78241,7 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -75769,35 +78250,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-30", - "last_updated": "2026-02-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.13, - "output": 0.4, - "reasoning": 0.4, - "cache_read": 0.013, - "cache_write": 0.16 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "NousResearch/Hermes-4-405B", - "name": "Hermes-4-405B", - "display_name": "Hermes-4-405B", + "id": "qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B FP8", + "display_name": "Qwen3 235B A22B FP8", "modalities": { "input": [ "text" @@ -75807,7 +78273,7 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -75816,80 +78282,62 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-30", - "last_updated": "2026-02-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 1, - "output": 3, - "reasoning": 3, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.5, + "output": 2.5 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", + "id": "qwen25-coder-7b", + "name": "Qwen2.5 Coder 7B", + "display_name": "Qwen2.5 Coder 7B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2026-02-04", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025, - "cache_write": 0.31 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "qwen3-vl-30b-a3b-thinking", + "name": "Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen3 VL 30B A3B Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 131072, "output": 8192 }, "temperature": true, @@ -75909,55 +78357,86 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-15", - "last_updated": "2026-05-07", + "release_date": "2025-10-02", + "last_updated": "2025-10-02", "cost": { - "input": 0.6, - "output": 3.6, - "cache_read": 0.06, - "cache_write": 0.75 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen3-Embedding-8B", - "display_name": "Qwen3-Embedding-8B", + "id": "deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.56, + "output": 1.68, + "cache_read": 0.11 + }, + "type": "chat" + }, + { + "id": "llama-4-scout-17b-instruct", + "name": "Llama 4 Scout 17B Instruct", + "display_name": "Llama 4 Scout 17B Instruct", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 8192, + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-10", - "last_updated": "2026-02-04", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.01, - "output": 0 + "input": 0.17, + "output": 0.66 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen3-30B-A3B-Instruct-2507", + "id": "qwen3-32b-fp8", + "name": "Qwen3 32B FP8", + "display_name": "Qwen3 32B FP8", "modalities": { "input": [ "text" @@ -75967,64 +78446,62 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 + "output": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "claude-3-opus", + "name": "Claude 3 Opus", + "display_name": "Claude 3 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-10-04", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0.2, - "output": 0.6 + "input": 15, + "output": 75, + "cache_read": 1.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct (2507)", + "display_name": "Qwen3 235B A22B Instruct (2507)", "modalities": { "input": [ "text" @@ -76034,88 +78511,60 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507-fast", - "name": "Qwen3-235B-A22B-Thinking-2507-fast", - "display_name": "Qwen3-235B-A22B-Thinking-2507-fast", + "id": "custom", + "name": "Custom Model", + "display_name": "Custom Model", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2026-05-07", + "attachment": true, + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B-fast", - "name": "Qwen3.5-397B-A17B-fast", - "display_name": "Qwen3.5-397B-A17B-fast", + "id": "llama-3-70b-instruct", + "name": "Llama 3 70B Instruct", + "display_name": "Llama 3 70B Instruct", "modalities": { "input": [ "text" @@ -76125,89 +78574,60 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 8192, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-15", - "last_updated": "2026-05-07", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.6, - "output": 3.6, - "cache_read": 0.06, - "cache_write": 0.75 + "input": 0.51, + "output": 0.74 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking-fast", - "name": "Qwen3-Next-80B-A3B-Thinking-fast", - "display_name": "Qwen3-Next-80B-A3B-Thinking-fast", + "id": "qwen3-vl-8b-instruct", + "name": "Qwen3 VL 8B Instruct", + "display_name": "Qwen3 VL 8B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2026-05-07", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.15, - "output": 1.2, - "cache_read": 0.015, - "cache_write": 0.1875 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking (2507)", + "display_name": "Qwen3 235B A22B Thinking (2507)", "modalities": { "input": [ "text" @@ -76217,8 +78637,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -76239,22 +78659,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.15, - "output": 1.2, - "reasoning": 1.2, - "cache_read": 0.015, - "cache_write": 0.18 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "PrimeIntellect/INTELLECT-3", - "name": "INTELLECT-3", - "display_name": "INTELLECT-3", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -76264,8 +78680,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -76274,21 +78690,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-25", - "last_updated": "2026-02-04", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.02, - "cache_write": 0.25 + "input": 1, + "output": 3, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "claude-3-5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text" @@ -76299,42 +78713,28 @@ }, "limit": { "context": 200000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-03-01", - "last_updated": "2026-03-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.1, - "cache_write": 1 + "input": 0.8, + "output": 4, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -76344,31 +78744,28 @@ ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-12-05", - "last_updated": "2026-02-04", + "release_date": "2025-04-03", + "last_updated": "2025-04-03", "cost": { - "input": 0.13, - "output": 0.4, - "cache_read": 0.013, - "cache_write": 0.16 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "gemma-3-1b-it", + "name": "Gemma 3 1B IT", + "display_name": "Gemma 3 1B IT", "modalities": { "input": [ "text" @@ -76378,34 +78775,32 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2024-07-23", - "last_updated": "2026-02-04", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.02, - "output": 0.06, - "cache_read": 0.002, - "cache_write": 0.025 + "input": 0.08, + "output": 0.3 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron-3-Super-120B-A12B", - "display_name": "Nemotron-3-Super-120B-A12B", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max (2026-01-23)", + "display_name": "Qwen3 Max (2026-01-23)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -76413,7 +78808,7 @@ }, "limit": { "context": 256000, - "output": 32768 + "output": 32800 }, "temperature": true, "tool_call": true, @@ -76421,24 +78816,36 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 0.3, - "output": 0.9 + "input": 3, + "output": 15, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", - "name": "Llama-3.1-Nemotron-Ultra-253B-v1", - "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "id": "glm-4.6v-flashx", + "name": "GLM-4.6V FlashX", + "display_name": "GLM-4.6V FlashX", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -76446,30 +78853,29 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.6, - "output": 1.8, - "cache_read": 0.06, - "cache_write": 0.75 + "input": 0.04, + "output": 0.4, + "cache_read": 0 }, "type": "chat" }, { - "id": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B", - "name": "Nemotron-3-Nano-30B-A3B", - "display_name": "Nemotron-3-Nano-30B-A3B", + "id": "minimax-text-01", + "name": "MiniMax Text 01", + "display_name": "MiniMax Text 01", "modalities": { "input": [ "text" @@ -76479,31 +78885,29 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 1000000, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-08-10", - "last_updated": "2026-02-04", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.006, - "cache_write": 0.075 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "nvidia/Nemotron-3-Nano-Omni", - "name": "Nemotron-3-Nano-Omni", - "display_name": "Nemotron-3-Nano-Omni", + "id": "llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -76513,32 +78917,28 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 32768, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2026-05-07", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.006, - "cache_write": 0.075 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-fast", - "name": "DeepSeek-V3.2-fast", - "display_name": "DeepSeek-V3.2-fast", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -76548,8 +78948,8 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 131072, + "output": 32766 }, "temperature": true, "tool_call": true, @@ -76557,23 +78957,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2026-05-07", + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.04, - "cache_write": 0.5 + "input": 0.15, + "output": 0.75 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ "text" @@ -76583,89 +78985,71 @@ ] }, "limit": { - "context": 163000, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-20", - "last_updated": "2026-02-04", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 0.3, - "output": 0.45, - "reasoning": 0.45, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b-fast", - "name": "gpt-oss-120b-fast", - "display_name": "gpt-oss-120b-fast", + "id": "ministral-8b-2512", + "name": "Ministral 8B", + "display_name": "Ministral 8B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, + "context": 262144, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-06-10", - "last_updated": "2026-05-07", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.1, - "output": 0.5, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "seed-1-8-251228", + "name": "Seed 1.8 (251228)", + "display_name": "Seed 1.8 (251228)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 256000, "output": 8192 }, "temperature": true, @@ -76674,69 +79058,53 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2026-01-10", - "last_updated": "2026-02-04", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 0.15, - "output": 0.6, - "reasoning": 0.6, - "cache_read": 0.015, - "cache_write": 0.18 + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "google/gemma-2-2b-it", - "name": "Gemma-2-2b-it", - "display_name": "Gemma-2-2b-it", + "id": "qwen3-vl-30b-a3b-instruct", + "name": "Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen3 VL 30B A3B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-07-31", - "last_updated": "2026-02-04", + "release_date": "2025-10-02", + "last_updated": "2025-10-02", "cost": { - "input": 0.02, - "output": 0.06, - "cache_read": 0.002, - "cache_write": 0.025 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma-3-27b-it", - "display_name": "Gemma-3-27b-it", + "id": "llama-4-maverick-17b-instruct", + "name": "Llama 4 Maverick 17B Instruct", + "display_name": "Llama 4 Maverick 17B Instruct", "modalities": { "input": [ "text", @@ -76747,31 +79115,28 @@ ] }, "limit": { - "context": 110000, - "output": 8192 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-20", - "last_updated": "2026-02-04", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 0.24, + "output": 0.97 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5-fast", - "name": "Kimi-K2.5-fast", - "display_name": "Kimi-K2.5-fast", + "id": "auto", + "name": "Auto Route", + "display_name": "Auto Route", "modalities": { "input": [ "text", @@ -76782,55 +79147,39 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-12-15", - "last_updated": "2026-02-04", + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.5, - "output": 2.5, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "glm-4.5-x", + "name": "GLM-4.5 X", + "display_name": "GLM-4.5 X", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -76838,35 +79187,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-12-15", - "last_updated": "2026-02-04", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.5, - "output": 2.5, - "reasoning": 2.5, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 2.2, + "output": 8.9, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "glm-4-32b-0414-128k", + "name": "GLM-4 32B (0414-128k)", + "display_name": "GLM-4 32B (0414-128k)", "modalities": { "input": [ "text" @@ -76876,48 +79211,40 @@ ] }, "limit": { - "context": 196608, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2026-05-07", + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5-fast", - "name": "MiniMax-M2.5-fast", - "display_name": "MiniMax-M2.5-fast", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast Reasoning", + "display_name": "Grok 4 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -76925,40 +79252,43 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2026-05-07", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -76971,71 +79301,64 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 1.75, - "output": 3.5, - "cache_read": 0.15 + "input": 0.3, + "output": 0.9 }, "type": "chat" - } - ] - }, - "poe": { - "id": "poe", - "name": "Poe", - "display_name": "Poe", - "api": "https://api.poe.com/v1", - "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", - "models": [ + }, { - "id": "topazlabs-co/topazlabs", - "name": "TopazLabs", - "display_name": "TopazLabs", + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 204, - "output": 8192 + "context": 128000, + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.22, + "output": 0.22 + }, "type": "chat" }, { - "id": "novita/kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 262144 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -77043,115 +79366,89 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "novita/glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", + "cost": { + "input": 2.8, + "output": 8.4 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", "type": "chat" }, { - "id": "novita/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "novita/minimax-m2.1", - "name": "minimax-m2.1", - "display_name": "minimax-m2.1", + "id": "minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -77161,10 +79458,10 @@ ] }, "limit": { - "context": 205000, + "context": 204800, "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -77175,48 +79472,20 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-26", - "last_updated": "2025-12-26", - "type": "chat" - }, - { - "id": "novita/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.3, + "output": 1.2 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", "type": "chat" }, { - "id": "novita/kimi-k2.6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -77231,7 +79500,7 @@ "context": 262144, "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -77239,54 +79508,73 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-05-02", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.96, - "output": 4.04, - "cache_read": 0.16 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "novita/glm-4.6v", - "name": "glm-4.6v", - "display_name": "glm-4.6v", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + }, "type": "chat" }, { - "id": "novita/deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -77296,8 +79584,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -77307,24 +79595,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.13 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "novita/glm-4.7-flash", - "name": "glm-4.7-flash", - "display_name": "glm-4.7-flash", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -77335,9 +79630,9 @@ }, "limit": { "context": 200000, - "output": 65500 + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -77345,60 +79640,80 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 6, + "output": 24, + "cache_read": 1.3, + "cache_write": 0 + }, "type": "chat" }, { - "id": "novita/glm-4.7-n", - "name": "glm-4.7-n", - "display_name": "glm-4.7-n", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, "type": "chat" }, { - "id": "novita/kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "qwen3-vl-plus", + "name": "Qwen3-VL Plus", + "display_name": "Qwen3-VL Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -77415,16 +79730,22 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "cost": { + "input": 0.2, + "output": 1.6, + "reasoning": 4.8 + }, "type": "chat" }, { - "id": "fireworks-ai/kimi-k2.5-fw", - "name": "Kimi-K2.5-FW", - "display_name": "Kimi-K2.5-FW", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -77435,59 +79756,102 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "empiriolabs/deepseek-v4-pro-el", - "name": "DeepSeek-V4-Pro-EL", - "display_name": "DeepSeek-V4-Pro-EL", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 262144, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-05-02", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.67, - "output": 3.33 + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "empiriolabs/deepseek-v4-flash-el", - "name": "DeepSeek-V4-Flash-EL", - "display_name": "DeepSeek-V4-Flash-EL", + "id": "gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -77497,122 +79861,125 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 16385, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-05-02", + "attachment": false, + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.14, - "output": 0.28 + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "elevenlabs/elevenlabs-v2.5-turbo", - "name": "ElevenLabs-v2.5-Turbo", - "display_name": "ElevenLabs-v2.5-Turbo", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ - "audio" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-28", - "last_updated": "2024-10-28", - "type": "chat" - }, - { - "id": "elevenlabs/elevenlabs-v3", - "name": "ElevenLabs-v3", - "display_name": "ElevenLabs-v3", - "modalities": { - "input": [ "text" - ], - "output": [ - "audio" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 + }, "type": "chat" }, { - "id": "elevenlabs/elevenlabs-music", - "name": "ElevenLabs-Music", - "display_name": "ElevenLabs-Music", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 2000, - "output": 8192 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-29", - "last_updated": "2025-08-29", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + }, "type": "chat" }, { - "id": "cerebras/gpt-oss-120b-cs", - "name": "GPT-OSS-120B-CS", - "display_name": "GPT-OSS-120B-CS", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -77620,105 +79987,199 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.35, - "output": 0.75 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "cerebras/llama-3.1-8b-cs", - "name": "Llama-3.1-8B-CS", - "display_name": "Llama-3.1-8B-CS", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-13", - "last_updated": "2025-05-13", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "cerebras/qwen3-32b-cs", - "name": "qwen3-32b-cs", - "display_name": "qwen3-32b-cs", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-05-15", - "last_updated": "2025-05-15", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] + }, "type": "chat" }, { - "id": "cerebras/qwen3-235b-2507-cs", - "name": "qwen3-235b-2507-cs", - "display_name": "qwen3-235b-2507-cs", + "id": "gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10 + }, "type": "chat" }, { - "id": "cerebras/llama-3.3-70b-cs", - "name": "llama-3.3-70b-cs", - "display_name": "llama-3.3-70b-cs", + "id": "minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -77728,62 +80189,46 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 196608, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-13", - "last_updated": "2025-05-13", - "type": "chat" - }, - { - "id": "stabilityai/stablediffusionxl", - "name": "StableDiffusionXL", - "display_name": "StableDiffusionXL", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" - ] + "supported": true, + "default": true }, - "limit": { - "context": 200, - "output": 8192 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.3, + "output": 1.2 }, - "attachment": true, - "open_weights": false, - "release_date": "2023-07-09", - "last_updated": "2023-07-09", "type": "chat" }, { - "id": "xai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -77799,19 +80244,33 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-22", - "last_updated": "2025-08-22", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 30, + "output": 180, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "xai/grok-4-fast-reasoning", - "name": "Grok-4-Fast-Reasoning", - "display_name": "Grok-4-Fast-Reasoning", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ "text", @@ -77822,63 +80281,96 @@ ] }, "limit": { - "context": 2000000, + "context": 400000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-non-reasoning", - "name": "Grok-4.1-Fast-Non-Reasoning", - "display_name": "Grok-4.1-Fast-Non-Reasoning", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", + "cost": { + "input": 0.8, + "output": 2.4 + }, "type": "chat" }, { - "id": "xai/grok-4", - "name": "Grok-4", - "display_name": "Grok-4", + "id": "gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ "text", @@ -77889,7 +80381,7 @@ ] }, "limit": { - "context": 256000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -77900,24 +80392,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -77927,34 +80434,45 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", - "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 - }, - "type": "chat" - }, - { - "id": "xai/grok-4.20-multi-agent", - "name": "Grok-4.20-Multi-Agent", - "display_name": "Grok-4.20-Multi-Agent", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 + }, + "type": "chat" + }, + { + "id": "sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -77962,340 +80480,398 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { "input": 3, "output": 15, - "cache_read": 0.75 + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "xai/grok-4-fast-non-reasoning", - "name": "Grok-4-Fast-Non-Reasoning", - "display_name": "Grok-4-Fast-Non-Reasoning", + "id": "qwen35-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-reasoning", - "name": "Grok-4.1-Fast-Reasoning", - "display_name": "Grok-4.1-Fast-Reasoning", + "id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "cost": { + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 + }, "type": "chat" }, { - "id": "runwayml/runway", - "name": "Runway", - "display_name": "Runway", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, - "output": 8192 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "cost": { + "input": 1.2, + "output": 6 + }, "type": "chat" }, { - "id": "runwayml/runway-gen-4-turbo", - "name": "Runway-Gen-4-Turbo", - "display_name": "Runway-Gen-4-Turbo", + "id": "devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, - "output": 8192 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-09", - "last_updated": "2025-05-09", + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0.4, + "output": 2 + }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-Max", - "display_name": "GPT-5.1-Codex-Max", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/sora-2-pro", - "name": "Sora-2-Pro", - "display_name": "Sora-2-Pro", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", "type": "chat" }, { - "id": "openai/chatgpt-4o-latest", - "name": "ChatGPT-4o-Latest", - "display_name": "ChatGPT-4o-Latest", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-14", - "last_updated": "2024-08-14", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 4.5, - "output": 14 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5-Chat", - "display_name": "GPT-5-Chat", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 64000, "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT-5.2-Pro", - "display_name": "GPT-5.2-Pro", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -78303,150 +80879,150 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 19, - "output": 150 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-4o-aug", - "name": "GPT-4o-Aug", - "display_name": "GPT-4o-Aug", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2024-11-21", - "last_updated": "2024-11-21", + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2.2, - "output": 9, - "cache_read": 1.1 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "openai/gpt-image-2", - "name": "GPT-Image-2", - "display_name": "GPT-Image-2", + "id": "devstral-small-2507", + "name": "Devstral Small", + "display_name": "Devstral Small", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 5.0505, - "output": 32.3232, - "cache_read": 1.2626 + "input": 0.1, + "output": 0.3 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4-classic-0314", - "name": "GPT-4-Classic-0314", - "display_name": "GPT-4-Classic-0314", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-08-26", - "last_updated": "2024-08-26", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 27, - "output": 54 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5-mini", - "display_name": "GPT-5-mini", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -78454,109 +81030,74 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.22, - "output": 1.8, - "cache_read": 0.022 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5-nano", - "display_name": "GPT-5-nano", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.045, - "output": 0.36, - "cache_read": 0.0045 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3-Codex", - "display_name": "GPT-5.3-Codex", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -78565,85 +81106,77 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-10", - "last_updated": "2026-02-10", + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-04-28", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 0.05, + "output": 0.2, + "reasoning": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4-Turbo", - "display_name": "GPT-4-Turbo", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2023-09-13", + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 9, - "output": 27 + "input": 1.6, + "output": 6.4 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -78653,39 +81186,45 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", @@ -78696,8 +81235,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 272000 }, "temperature": false, "tool_call": true, @@ -78709,9 +81248,10 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -78721,32 +81261,64 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 18, - "output": 72 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "o3-mini-high", - "display_name": "o3-mini-high", + "id": "gemma-3n-e2b-it", + "name": "Gemma 3n 2B", + "display_name": "Gemma 3n 2B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 2000 }, - "temperature": false, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -78755,64 +81327,65 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.99, - "output": 4 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o-mini", - "display_name": "GPT-4o-mini", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 124096, - "output": 4096 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.14, - "output": 0.54, - "cache_read": 0.068 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "gemma-3n-e4b-it", + "name": "Gemma 3n 4B", + "display_name": "Gemma 3n 4B", "modalities": { "input": [ "text" @@ -78822,58 +81395,46 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 2000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "GPT-5.4-Mini", - "display_name": "GPT-5.4-Mini", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -78883,80 +81444,110 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-03-12", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.68, - "output": 4, - "cache_read": 0.068 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "openai/dall-e-3", - "name": "DALL-E-3", - "display_name": "DALL-E-3", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 800, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": true, - "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2023-11-06", - "type": "imageGeneration" - }, - { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", - "modalities": { - "input": [ - "text", - "image" - ], + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 + }, + "type": "chat" + }, + { + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", + "modalities": { + "input": [ + "text", + "image", + "video" + ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -78965,32 +81556,49 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.99, - "output": 4, - "cache_read": 0.25 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT-5.4-Nano", - "display_name": "GPT-5.4-Nano", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -79020,8 +81628,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -79034,47 +81641,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.18, - "output": 1.1, - "cache_read": 0.018 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-image-1", - "name": "GPT-Image-1", - "display_name": "GPT-Image-1", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", - "type": "imageGeneration" - }, - { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -79101,10 +81681,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -79117,19 +81697,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "display_name": "GPT-5.1-Codex-Mini", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -79139,62 +81720,41 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.22, - "output": 1.8, - "cache_read": 0.022 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -79213,7 +81773,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -79226,47 +81787,55 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "openai/gpt-image-1-mini", - "name": "GPT-Image-1-Mini", - "display_name": "GPT-Image-1-Mini", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", - "type": "imageGeneration" + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + }, + "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", @@ -79277,128 +81846,110 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-12-18", - "last_updated": "2024-12-18", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 14, - "output": 54 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT-5.4-Pro", - "display_name": "GPT-5.4-Pro", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 27, - "output": 160 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-Turbo", - "display_name": "GPT-3.5-Turbo", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 2048 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2023-09-13", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.45, - "output": 1.4 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next 80B-A3B (Thinking)", + "display_name": "Qwen3-Next 80B-A3B (Thinking)", "modalities": { "input": [ "text" @@ -79408,10 +81959,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -79420,36 +81971,34 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 9, - "output": 36, - "cache_read": 2.2 + "input": 0.5, + "output": 6 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -79457,56 +82006,44 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.99, - "output": 4 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -79515,128 +82052,114 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 140, - "output": 540 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-4o-search", - "name": "GPT-4o-Search", - "display_name": "GPT-4o-Search", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1048576, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 2.2, - "output": 9 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.1, - "output": 9 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -79669,19 +82192,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 2.2, - "output": 14, - "cache_read": 0.22 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex-spark", - "name": "GPT-5.3-Codex-Spark", - "display_name": "GPT-5.3-Codex-Spark", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -79691,10 +82215,10 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -79703,107 +82227,117 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-04", - "last_updated": "2026-03-04", + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0, - "output": 0 + "input": 1.15, + "output": 8, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-raw", - "name": "GPT-3.5-Turbo-Raw", - "display_name": "GPT-3.5-Turbo-Raw", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 4524, - "output": 2048 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2023-09-27", - "last_updated": "2023-09-27", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0.45, - "output": 1.4 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.09, - "output": 0.36, - "cache_read": 0.022 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -79835,33 +82369,33 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5-Pro", - "display_name": "GPT-5-Pro", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -79870,155 +82404,165 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 14, - "output": 110 + "input": 1, + "output": 3, + "cache_read": 0.2, + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "openai/sora-2", - "name": "Sora-2", - "display_name": "Sora-2", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 131072, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", + "cost": { + "input": 0.21, + "output": 0.63 + }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", + "cost": { + "input": 0.07, + "output": 0.27, + "input_audio": 4.44, + "output_audio": 8.89 + }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.2-instant", - "name": "GPT-5.2-Instant", - "display_name": "GPT-5.2-Instant", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -80031,129 +82575,266 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", "xhigh" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search", - "name": "GPT-4o-mini-Search", - "display_name": "GPT-4o-mini-Search", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.14, - "output": 0.54 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + }, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ] }, "type": "chat" }, { - "id": "openai/gpt-image-1.5", - "name": "gpt-image-1.5", - "display_name": "gpt-image-1.5", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 384000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "type": "imageGeneration" - }, - { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "GPT-3.5-Turbo-Instruct", - "display_name": "GPT-3.5-Turbo-Instruct", - "modalities": { - "input": [ - "text", - "image" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 + }, + "type": "chat" + }, + { + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 3500, - "output": 1024 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2023-09-20", - "last_updated": "2023-09-20", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 1.4, - "output": 1.8 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] + }, + "type": "chat" + }, + { + "id": "grok-4-20-beta-0309-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ "text", @@ -80164,29 +82845,46 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 + "input": 2, + "output": 6, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "openai/gpt-5.1-instant", - "name": "GPT-5.1-Instant", - "display_name": "GPT-5.1-Instant", + "id": "mistral-small-2506", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ "text", @@ -80200,23 +82898,57 @@ "context": 128000, "output": 16384 }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "cost": { + "input": 0.1, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -80229,84 +82961,140 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.36, - "output": 1.4, - "cache_read": 0.09 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "openai/gpt-4-classic", - "name": "GPT-4-Classic", - "display_name": "GPT-4-Classic", + "id": "qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2024-03-25", - "last_updated": "2024-03-25", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 27, - "output": 54 + "input": 0.248, + "output": 1.485 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", @@ -80317,26 +83105,25 @@ ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", - "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -80349,19 +83136,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "openai/gpt-5.3-instant", - "name": "GPT-5.3-Instant", - "display_name": "GPT-5.3-Instant", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", @@ -80378,240 +83165,235 @@ "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "google/veo-3-fast", - "name": "Veo-3-Fast", - "display_name": "Veo-3-Fast", + "id": "mistral-large-latest", + "name": "Mistral Large (latest)", + "display_name": "Mistral Large (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-13", - "last_updated": "2025-10-13", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 + }, "type": "chat" }, { - "id": "google/veo-3.1-fast", - "name": "Veo-3.1-Fast", - "display_name": "Veo-3.1-Fast", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 1.5, + "output": 7.5 + }, "type": "chat" }, { - "id": "google/gemini-3.1-pro", - "name": "Gemini-3.1-Pro", - "display_name": "Gemini-3.1-Pro", + "id": "sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { "input": 2, - "output": 12, - "cache_read": 0.2 + "output": 8 }, "type": "chat" }, { - "id": "google/imagen-3-fast", - "name": "Imagen-3-Fast", - "display_name": "Imagen-3-Fast", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-10-17", - "last_updated": "2024-10-17", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + }, "type": "chat" }, { - "id": "google/gemini-2.0-flash", - "name": "Gemini-2.0-Flash", - "display_name": "Gemini-2.0-Flash", + "id": "gemma-3-12b-it", + "name": "Gemma 3 12B", + "display_name": "Gemma 3 12B", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 990000, + "context": 32768, "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.1, - "output": 0.42 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-deep-research", - "name": "gemini-deep-research", - "display_name": "gemini-deep-research", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 8192, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1.6, - "output": 9.6 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini-2.5-Pro", - "display_name": "Gemini-2.5-Pro", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -80623,113 +83405,158 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.87, - "output": 7, - "cache_read": 0.087 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "google/imagen-3", - "name": "Imagen-3", - "display_name": "Imagen-3", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-10-15", - "last_updated": "2024-10-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, "type": "chat" }, { - "id": "google/nano-banana", - "name": "Nano-Banana", - "display_name": "Nano-Banana", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.21, - "output": 1.8, - "cache_read": 0.021 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini-2.5-Flash", - "display_name": "Gemini-2.5-Flash", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -80738,44 +83565,38 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-26", - "last_updated": "2025-04-26", + "knowledge": "2025-04", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.21, - "output": 1.8, - "cache_read": 0.021 + "input": 1.3, + "output": 7.8, + "cache_read": 0.13, + "cache_write": 1.625 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Gemini-3.1-Flash-Lite", - "display_name": "Gemini-3.1-Flash-Lite", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", "video", - "audio" + "pdf" ], "output": [ "text" @@ -80785,7 +83606,7 @@ "context": 1048576, "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -80793,37 +83614,53 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-18", - "last_updated": "2026-02-18", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.25, - "output": 1.5 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "google/gemini-3-flash", - "name": "Gemini-3-Flash", - "display_name": "Gemini-3-Flash", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -80835,459 +83672,532 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ "minimal", "low", "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-07", - "last_updated": "2025-10-07", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "google/veo-3.1", - "name": "Veo-3.1", - "display_name": "Veo-3.1", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" ], "output": [ - "video" - ] - }, - "limit": { - "context": 480, - "output": 8192 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "type": "chat" - }, - { - "id": "google/lyria", - "name": "Lyria", - "display_name": "Lyria", - "modalities": { - "input": [ "text" - ], - "output": [ - "audio" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", - "type": "chat" - }, - { - "id": "google/imagen-4-ultra", - "name": "Imagen-4-Ultra", - "display_name": "Imagen-4-Ultra", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 480, - "output": 8192 + "supported": true, + "default": true }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-24", - "last_updated": "2025-05-24", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, "type": "chat" }, { - "id": "google/nano-banana-pro", - "name": "Nano-Banana-Pro", - "display_name": "Nano-Banana-Pro", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "google/gemini-3-pro", - "name": "Gemini-3-Pro", - "display_name": "Gemini-3-Pro", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", "image", - "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ "low", + "medium", "high" ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 1.6, - "output": 9.6, - "cache_read": 0.16 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "google/imagen-4-fast", - "name": "Imagen-4-Fast", - "display_name": "Imagen-4-Fast", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 0.45, + "output": 2.25 + }, "type": "chat" }, { - "id": "google/veo-3", - "name": "Veo-3", - "display_name": "Veo-3", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini-2.5-Flash-Lite", - "display_name": "Gemini-2.5-Flash-Lite", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next 80B-A3B Instruct", + "display_name": "Qwen3-Next 80B-A3B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1024000, - "output": 64000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-19", - "last_updated": "2025-06-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "google/imagen-4", - "name": "Imagen-4", - "display_name": "Imagen-4", + "id": "minimax-m2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "cost": { + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", "type": "chat" }, { - "id": "google/gemma-4-31b", - "name": "Gemma-4-31B", - "display_name": "Gemma-4-31B", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini-2.0-Flash-Lite", - "display_name": "Gemini-2.0-Flash-Lite", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", "image", + "audio", "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 990000, + "context": 1048576, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.052, - "output": 0.21 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "google/veo-2", - "name": "Veo-2", - "display_name": "Veo-2", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-12-02", - "last_updated": "2024-12-02", + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, "type": "chat" }, { - "id": "lumalabs/ray2", - "name": "Ray2", - "display_name": "Ray2", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 5000, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude-Opus-4.1", - "display_name": "Claude-Opus-4.1", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", @@ -81299,10 +84209,10 @@ ] }, "limit": { - "context": 196608, - "output": 32000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -81310,440 +84220,418 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.5", - "name": "Claude-Sonnet-3.5", - "display_name": "Claude-Sonnet-3.5", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 189096, + "context": 131072, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.8, + "output": 3.2 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-3", - "name": "Claude-Haiku-3", - "display_name": "Claude-Haiku-3", + "id": "gemma-3-4b-it", + "name": "Gemma 3 4B", + "display_name": "Gemma 3 4B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 189096, + "context": 32768, "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-03-09", - "last_updated": "2024-03-09", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.21, - "output": 1.1, - "cache_read": 0.021, - "cache_write": 0.26 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude-Opus-4.6", - "display_name": "Claude-Opus-4.6", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 128000 + "context": 1000000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.3 + "input": 0.4, + "output": 1.2, + "reasoning": 4 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude-Opus-4.7", - "display_name": "Claude-Opus-4.7", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-15", - "last_updated": "2026-04-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.4 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude-Sonnet-4", - "display_name": "Claude-Sonnet-4", + "id": "grok-4-20-beta-0309-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 64000 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 2, + "output": 6, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude-Sonnet-4.5", - "display_name": "Claude-Sonnet-4.5", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 32768 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude-Opus-4.5", - "display_name": "Claude-Opus-4.5", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2025-11-21", - "last_updated": "2025-11-21", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.3 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.7", - "name": "Claude-Sonnet-3.7", - "display_name": "Claude-Sonnet-3.7", + "id": "sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 200000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude-Opus-4", - "display_name": "Claude-Opus-4", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 192512, - "output": 28672 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-3.5", - "name": "Claude-Haiku-3.5", - "display_name": "Claude-Haiku-3.5", + "id": "pixtral-large-latest", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 128000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0.68, - "output": 3.4, - "cache_read": 0.068, - "cache_write": 0.85 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude-Haiku-4.5", - "display_name": "Claude-Haiku-4.5", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 192000, - "output": 64000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -81751,119 +84639,113 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.85, - "output": 4.3, - "cache_read": 0.085, - "cache_write": 1.1 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.5-june", - "name": "Claude-Sonnet-3.5-June", - "display_name": "Claude-Sonnet-3.5-June", + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-11-18", - "last_updated": "2024-11-18", + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" - }, + } + ] + }, + "poe": { + "id": "poe", + "name": "Poe", + "display_name": "Poe", + "api": "https://api.poe.com/v1", + "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", + "models": [ { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude-Sonnet-4.6", - "display_name": "Claude-Sonnet-4.6", + "id": "ideogramai/ideogram-v2a-turbo", + "name": "Ideogram-v2a-Turbo", + "display_name": "Ideogram-v2a-Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 983040, - "output": 128000 + "context": 150, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", - "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "type": "chat" }, { - "id": "ideogramai/ideogram", - "name": "Ideogram", - "display_name": "Ideogram", + "id": "ideogramai/ideogram-v2", + "name": "Ideogram-v2", + "display_name": "Ideogram-v2", "modalities": { "input": [ "text", @@ -81884,14 +84766,14 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2024-04-03", + "release_date": "2024-08-21", + "last_updated": "2024-08-21", "type": "chat" }, { - "id": "ideogramai/ideogram-v2", - "name": "Ideogram-v2", - "display_name": "Ideogram-v2", + "id": "ideogramai/ideogram", + "name": "Ideogram", + "display_name": "Ideogram", "modalities": { "input": [ "text", @@ -81912,14 +84794,14 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-08-21", - "last_updated": "2024-08-21", + "release_date": "2024-04-03", + "last_updated": "2024-04-03", "type": "chat" }, { - "id": "ideogramai/ideogram-v2a-turbo", - "name": "Ideogram-v2a-Turbo", - "display_name": "Ideogram-v2a-Turbo", + "id": "ideogramai/ideogram-v2a", + "name": "Ideogram-v2a", + "display_name": "Ideogram-v2a", "modalities": { "input": [ "text" @@ -81944,19 +84826,20 @@ "type": "chat" }, { - "id": "ideogramai/ideogram-v2a", - "name": "Ideogram-v2a", - "display_name": "Ideogram-v2a", + "id": "openai/chatgpt-4o-latest", + "name": "ChatGPT-4o-Latest", + "display_name": "ChatGPT-4o-Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, + "context": 128000, "output": 8192 }, "temperature": false, @@ -81966,24 +84849,29 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2024-08-14", + "last_updated": "2024-08-14", + "cost": { + "input": 4.5, + "output": 14 + }, "type": "chat" }, { - "id": "trytako/tako", - "name": "Tako", - "display_name": "Tako", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2048, + "context": 128000, "output": 8192 }, "temperature": false, @@ -81993,20 +84881,21 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "type": "chat" }, { - "id": "poetools/claude-code", - "name": "claude-code", - "display_name": "claude-code", + "id": "openai/gpt-image-1-mini", + "name": "GPT-Image-1-Mini", + "display_name": "GPT-Image-1-Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { @@ -82016,27 +84905,25 @@ "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-27", - "last_updated": "2025-11-27", - "type": "chat" + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "type": "imageGeneration" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { @@ -82047,15 +84934,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high", @@ -82072,64 +84960,51 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 4.5455, - "output": 27.2727, - "cache_read": 0.4545 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "GPT-5.5-Pro", - "display_name": "GPT-5.5-Pro", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-Turbo", + "display_name": "GPT-3.5-Turbo", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 2048 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "release_date": "2023-09-13", + "last_updated": "2023-09-13", "cost": { - "input": 27.2727, - "output": 163.6364 + "input": 0.45, + "output": 1.4 }, "type": "chat" - } - ] - }, - "helicone": { - "id": "helicone", - "name": "Helicone", - "display_name": "Helicone", - "api": "https://ai-gateway.helicone.ai/v1", - "doc": "https://helicone.ai/models", - "models": [ + }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ "text", @@ -82140,29 +85015,43 @@ ] }, "limit": { - "context": 128000, - "output": 16400 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 20, - "output": 40 + "input": 18, + "output": 72 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "xAI Grok 4.1 Fast Reasoning", - "display_name": "xAI Grok 4.1 Fast Reasoning", + "id": "openai/gpt-5.3-instant", + "name": "GPT-5.3-Instant", + "display_name": "GPT-5.3-Instant", "modalities": { "input": [ "text", @@ -82173,167 +85062,231 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "gemma2-9b-it", - "name": "Google Gemma 2", - "display_name": "Google Gemma 2", + "id": "openai/sora-2-pro", + "name": "Sora-2-Pro", + "display_name": "Sora-2-Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { "context": 8192, "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-25", - "last_updated": "2024-06-25", - "cost": { - "input": 0.01, - "output": 0.03 - }, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Meta Llama 3.3 70B Instruct", - "display_name": "Meta Llama 3.3 70B Instruct", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4-Nano", + "display_name": "GPT-5.4-Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16400 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0.13, - "output": 0.39 + "input": 0.18, + "output": 1.1, + "cache_read": 0.018 }, "type": "chat" }, { - "id": "llama-4-scout", - "name": "Meta Llama 4 Scout 17B 16E", - "display_name": "Meta Llama 4 Scout 17B 16E", + "id": "openai/gpt-image-2", + "name": "GPT-Image-2", + "display_name": "GPT-Image-2", "modalities": { "input": [ "text", "image" ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 5.0505, + "output": 32.3232, + "cache_read": 1.2626 + }, + "type": "imageGeneration" + }, + { + "id": "openai/gpt-4o-mini-search", + "name": "GPT-4o-mini-Search", + "display_name": "GPT-4o-mini-Search", + "modalities": { + "input": [ + "text" + ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-03-11", + "last_updated": "2025-03-11", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0.14, + "output": 0.54 }, "type": "chat" }, { - "id": "chatgpt-4o-latest", - "name": "OpenAI ChatGPT-4o", - "display_name": "OpenAI ChatGPT-4o", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-14", - "last_updated": "2024-08-14", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 5, - "output": 20, - "cache_read": 2.5 + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "claude-3.5-sonnet-v2", - "name": "Anthropic: Claude 3.5 Sonnet v2", - "display_name": "Anthropic: Claude 3.5 Sonnet v2", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2-Pro", + "display_name": "GPT-5.2-Pro", "modalities": { "input": [ "text", @@ -82344,165 +85297,209 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 19, + "output": 150 }, "type": "chat" }, { - "id": "hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "openai/gpt-4-classic-0314", + "name": "GPT-4-Classic-0314", + "display_name": "GPT-4-Classic-0314", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "release_date": "2024-08-26", + "last_updated": "2024-08-26", "cost": { - "input": 0.14, - "output": 0.14 + "input": 27, + "output": 54 }, "type": "chat" }, { - "id": "claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", + "id": "openai/sora-2", + "name": "Sora-2", + "display_name": "Sora-2", "modalities": { "input": [ "text", "image" ], + "output": [ + "video" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "type": "chat" + }, + { + "id": "openai/gpt-5.3-codex-spark", + "name": "GPT-5.3-Codex-Spark", + "display_name": "GPT-5.3-Codex-Spark", + "modalities": { + "input": [ + "text" + ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-02", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2026-03-04", + "last_updated": "2026-03-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-prompt-guard-2-22m", - "name": "Meta Llama Prompt Guard 2 22M", - "display_name": "Meta Llama Prompt Guard 2 22M", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5-Turbo-Instruct", + "display_name": "GPT-3.5-Turbo-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 512, - "output": 2 + "context": 3500, + "output": 1024 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "release_date": "2023-09-20", + "last_updated": "2023-09-20", "cost": { - "input": 0.01, - "output": 0.01 + "input": 1.4, + "output": 1.8 }, "type": "chat" }, { - "id": "o1-mini", - "name": "OpenAI: o1-mini", - "display_name": "OpenAI: o1-mini", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -82514,6 +85511,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -82521,22 +85525,48 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "output": 9 }, "type": "chat" }, { - "id": "gpt-4.1-mini-2025-04-14", - "name": "OpenAI GPT-4.1 Mini", - "display_name": "OpenAI GPT-4.1 Mini", + "id": "openai/gpt-image-1.5", + "name": "gpt-image-1.5", + "display_name": "gpt-image-1.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", + "type": "imageGeneration" + }, + { + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", @@ -82550,40 +85580,40 @@ "context": 1047576, "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", "release_date": "2025-04-14", "last_updated": "2025-04-14", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999, - "cache_read": 0.09999999999999999 + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "openai/gpt-5-pro", + "name": "GPT-5-Pro", + "display_name": "GPT-5-Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -82591,100 +85621,98 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.03, - "output": 0.13 + "input": 14, + "output": 110 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 40960 + "context": 1047576, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.29, - "output": 0.59 + "input": 0.36, + "output": 1.4, + "cache_read": 0.09 }, "type": "chat" }, { - "id": "llama-3.3-70b-versatile", - "name": "Meta Llama 3.3 70B Versatile", - "display_name": "Meta Llama 3.3 70B Versatile", + "id": "openai/gpt-3.5-turbo-raw", + "name": "GPT-3.5-Turbo-Raw", + "display_name": "GPT-3.5-Turbo-Raw", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32678 + "context": 4524, + "output": 2048 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2023-09-27", + "last_updated": "2023-09-27", "cost": { - "input": 0.59, - "output": 0.7899999999999999 + "input": 0.45, + "output": 1.4 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "OpenAI GPT-5 Mini", - "display_name": "OpenAI GPT-5 Mini", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -82702,16 +85730,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", "high" @@ -82725,22 +85753,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.024999999999999998 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "OpenAI GPT-5 Nano", - "display_name": "OpenAI GPT-5 Nano", + "id": "openai/gpt-5-nano", + "name": "GPT-5-nano", + "display_name": "GPT-5-nano", "modalities": { "input": [ "text", @@ -82781,76 +85808,78 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.049999999999999996, - "output": 0.39999999999999997, - "cache_read": 0.005 + "input": 0.045, + "output": 0.36, + "cache_read": 0.0045 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Google Gemini 3 Pro Preview", - "display_name": "Google Gemini 3 Pro Preview", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", + "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.19999999999999998 + "input": 2.2, + "output": 14, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "claude-3-haiku-20240307", - "name": "Anthropic: Claude 3 Haiku", - "display_name": "Anthropic: Claude 3 Haiku", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o-mini", + "display_name": "GPT-4o-mini", "modalities": { "input": [ "text", @@ -82861,31 +85890,29 @@ ] }, "limit": { - "context": 200000, + "context": 124096, "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-07", - "last_updated": "2024-03-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.14, + "output": 0.54, + "cache_read": 0.068 }, "type": "chat" }, { - "id": "llama-4-maverick", - "name": "Meta Llama 4 Maverick 17B 128E", - "display_name": "Meta Llama 4 Maverick 17B 128E", + "id": "openai/o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", "modalities": { "input": [ "text", @@ -82896,29 +85923,43 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", "cost": { - "input": 0.15, - "output": 0.6 + "input": 140, + "output": 540 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Anthropic: Claude Sonnet 4.5 (20250929)", - "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "id": "openai/gpt-4-turbo", + "name": "GPT-4-Turbo", + "display_name": "GPT-4-Turbo", "modalities": { "input": [ "text", @@ -82929,87 +85970,55 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2023-09-13", + "last_updated": "2023-09-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 9, + "output": 27 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Google Gemini 2.5 Pro", - "display_name": "Google Gemini 2.5 Pro", + "id": "openai/dall-e-3", + "name": "DALL-E-3", + "display_name": "DALL-E-3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 800, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.3125, - "cache_write": 1.25 - }, - "type": "chat" + "release_date": "2023-11-06", + "last_updated": "2023-11-06", + "type": "imageGeneration" }, { - "id": "claude-4.5-opus", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4-Mini", + "display_name": "GPT-5.4-Mini", "modalities": { "input": [ "text", @@ -83020,102 +86029,111 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2026-03-12", + "last_updated": "2026-03-12", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.68, + "output": 4, + "cache_read": 0.068 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "xAI Grok 4.1 Fast Non-Reasoning", - "display_name": "xAI Grok 4.1 Fast Non-Reasoning", + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1-Instant", + "display_name": "GPT-5.1-Instant", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-17", - "last_updated": "2025-11-17", - "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 - }, - "type": "chat" - }, - { - "id": "sonar-pro", - "name": "Perplexity Sonar Pro", - "display_name": "Perplexity Sonar Pro", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 4096 + "supported": true, + "default": false }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 3, - "output": 15 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral-Large", - "display_name": "Mistral-Large", + "id": "openai/gpt-4o-aug", + "name": "GPT-4o-Aug", + "display_name": "GPT-4o-Aug", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -83123,28 +86141,28 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-24", - "last_updated": "2024-07-24", + "release_date": "2024-11-21", + "last_updated": "2024-11-21", "cost": { - "input": 2, - "output": 6 + "input": 2.2, + "output": 9, + "cache_read": 1.1 }, "type": "chat" }, { - "id": "o3-pro", - "name": "OpenAI o3 Pro", - "display_name": "OpenAI o3 Pro", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", @@ -83178,21 +86196,20 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2024-12-18", + "last_updated": "2024-12-18", "cost": { - "input": 20, - "output": 80 + "input": 14, + "output": 54 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "openai/o3-mini-high", + "name": "o3-mini-high", + "display_name": "o3-mini-high", "modalities": { "input": [ "text", @@ -83204,9 +86221,9 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -83214,26 +86231,32 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.99, + "output": 4 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "OpenAI GPT-4o-mini", - "display_name": "OpenAI GPT-4o-mini", + "id": "openai/gpt-4-classic", + "name": "GPT-4-Classic", + "display_name": "GPT-4-Classic", "modalities": { "input": [ "text", @@ -83244,109 +86267,126 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2024-03-25", + "last_updated": "2024-03-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 27, + "output": 54 }, "type": "chat" }, { - "id": "claude-4.5-haiku", - "name": "Anthropic: Claude 4.5 Haiku", - "display_name": "Anthropic: Claude 4.5 Haiku", + "id": "openai/gpt-4o-search", + "name": "GPT-4o-Search", + "display_name": "GPT-4o-Search", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 128000, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "release_date": "2025-03-11", + "last_updated": "2025-03-11", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.09999999999999999, - "cache_write": 1.25 + "input": 2.2, + "output": 9 }, "type": "chat" }, { - "id": "kimi-k2-0711", - "name": "Kimi K2 (07/11)", - "display_name": "Kimi K2 (07/11)", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-Max", + "display_name": "GPT-5.1-Codex-Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.5700000000000001, - "output": 2.3 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "o4-mini", - "name": "OpenAI o4 Mini", - "display_name": "OpenAI o4 Mini", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4-Pro", + "display_name": "GPT-5.4-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -83359,8 +86399,14 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -83368,22 +86414,20 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 27, + "output": 160 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Sonar Deep Research", - "display_name": "Perplexity Sonar Deep Research", + "id": "openai/o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", "modalities": { "input": [ "text" @@ -83393,30 +86437,44 @@ ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 2, - "output": 8 + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "display_name": "Google Gemma 3 12B", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ "text", @@ -83427,29 +86485,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.049999999999999996, - "output": 0.09999999999999999 + "input": 0.09, + "output": 0.36, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Google Gemini 2.5 Flash", - "display_name": "Google Gemini 2.5 Flash", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", @@ -83460,10 +86518,10 @@ ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -83473,79 +86531,93 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.3 + "input": 0.99, + "output": 4, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "deepseek-tng-r1t2-chimera", - "name": "DeepSeek TNG R1T2 Chimera", - "display_name": "DeepSeek TNG R1T2 Chimera", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 130000, - "output": 163840 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-02", - "last_updated": "2025-07-02", + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "OpenAI: GPT-5.1 Codex Mini", - "display_name": "OpenAI: GPT-5.1 Codex Mini", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { @@ -83556,19 +86628,19 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -83579,22 +86651,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.024999999999999998 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "openai/gpt-5-chat", + "name": "GPT-5-Chat", + "display_name": "GPT-5-Chat", "modalities": { "input": [ "text", @@ -83605,78 +86676,64 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "xAI Grok Code Fast 1", - "display_name": "xAI Grok Code Fast 1", + "id": "openai/gpt-image-1", + "name": "GPT-Image-1", + "display_name": "GPT-Image-1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 128000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-25", - "last_updated": "2024-08-25", - "cost": { - "input": 0.19999999999999998, - "output": 1.5, - "cache_read": 0.02 - }, - "type": "chat" + "release_date": "2025-03-31", + "last_updated": "2025-03-31", + "type": "imageGeneration" }, { - "id": "gpt-5.1", - "name": "OpenAI GPT-5.1", - "display_name": "OpenAI GPT-5.1", + "id": "openai/gpt-5-mini", + "name": "GPT-5-mini", + "display_name": "GPT-5-mini", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { @@ -83687,16 +86744,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -83710,66 +86767,68 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-06-25", + "last_updated": "2025-06-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 + "input": 0.99, + "output": 4 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "xAI: Grok 4 Fast Reasoning", - "display_name": "xAI: Grok 4 Fast Reasoning", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3-Codex", + "display_name": "GPT-5.3-Codex", "modalities": { "input": [ "text", @@ -83780,10 +86839,10 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -83791,28 +86850,44 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "release_date": "2026-02-10", + "last_updated": "2026-02-10", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -83823,7 +86898,7 @@ "output": 100000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -83842,22 +86917,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "llama-3.1-8b-instant", - "name": "Meta Llama 3.1 8B Instant", - "display_name": "Meta Llama 3.1 8B Instant", + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ "text" @@ -83867,40 +86941,112 @@ ] }, "limit": { - "context": 131072, - "output": 32678 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 0.049999999999999996, - "output": 0.08 + "input": 9, + "output": 36, + "cache_read": 2.2 }, "type": "chat" }, { - "id": "o3-mini", - "name": "OpenAI o3 Mini", - "display_name": "OpenAI o3 Mini", + "id": "openai/gpt-5.2-instant", + "name": "GPT-5.2-Instant", + "display_name": "GPT-5.2-Instant", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.6, + "output": 13, + "cache_read": 0.16 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -83915,6 +87061,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -83922,22 +87075,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2023-10-01", - "last_updated": "2023-10-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "sonar", - "name": "Perplexity Sonar", - "display_name": "Perplexity Sonar", + "id": "cerebras/llama-3.3-70b-cs", + "name": "llama-3.3-70b-cs", + "display_name": "llama-3.3-70b-cs", "modalities": { "input": [ "text" @@ -83947,29 +87099,24 @@ ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", - "cost": { - "input": 1, - "output": 1 - }, + "release_date": "2025-05-13", + "last_updated": "2025-05-13", "type": "chat" }, { - "id": "kimi-k2-0905", - "name": "Kimi K2 (09/05)", - "display_name": "Kimi K2 (09/05)", + "id": "cerebras/llama-3.1-8b-cs", + "name": "Llama-3.1-8B-CS", + "display_name": "Llama-3.1-8B-CS", "modalities": { "input": [ "text" @@ -83979,34 +87126,31 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2025-05-13", + "last_updated": "2025-05-13", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.39999999999999997 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "mistral-small", - "name": "Mistral Small", - "display_name": "Mistral Small", + "id": "cerebras/gpt-oss-120b-cs", + "name": "GPT-OSS-120B-CS", + "display_name": "GPT-OSS-120B-CS", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -84014,72 +87158,56 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-02", - "release_date": "2024-02-26", - "last_updated": "2024-02-26", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 75, - "output": 200 + "input": 0.35, + "output": 0.75 }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "cerebras/qwen3-235b-2507-cs", + "name": "qwen3-235b-2507-cs", + "display_name": "qwen3-235b-2507-cs", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 41000, - "output": 41000 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-01", - "last_updated": "2025-06-01", - "cost": { - "input": 0.08, - "output": 0.29 - }, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "grok-4", - "name": "xAI Grok 4", - "display_name": "xAI Grok 4", + "id": "cerebras/qwen3-32b-cs", + "name": "qwen3-32b-cs", + "display_name": "qwen3-32b-cs", "modalities": { "input": [ "text" @@ -84089,179 +87217,140 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-09", - "last_updated": "2024-07-09", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, + "release_date": "2025-05-15", + "last_updated": "2025-05-15", "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking", - "name": "Qwen3 235B A22B Thinking", - "display_name": "Qwen3 235B A22B Thinking", + "id": "runwayml/runway-gen-4-turbo", + "name": "Runway-Gen-4-Turbo", + "display_name": "Runway-Gen-4-Turbo", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 256, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "cost": { - "input": 0.3, - "output": 2.9000000000000004 - }, + "release_date": "2025-05-09", + "last_updated": "2025-05-09", "type": "chat" }, { - "id": "qwen2.5-coder-7b-fast", - "name": "Qwen2.5 Coder 7B fast", - "display_name": "Qwen2.5 Coder 7B fast", + "id": "runwayml/runway", + "name": "Runway", + "display_name": "Runway", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 32000, + "context": 256, "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09-15", - "last_updated": "2024-09-15", - "cost": { - "input": 0.03, - "output": 0.09 - }, + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "type": "chat" }, { - "id": "llama-3.1-8b-instruct-turbo", - "name": "Meta Llama 3.1 8B Instruct Turbo", - "display_name": "Meta Llama 3.1 8B Instruct Turbo", + "id": "stabilityai/stablediffusionxl", + "name": "StableDiffusionXL", + "display_name": "StableDiffusionXL", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.02, - "output": 0.03 - }, + "release_date": "2023-07-09", + "last_updated": "2023-07-09", "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "empiriolabs/deepseek-v4-flash-el", + "name": "DeepSeek-V4-Flash-EL", + "display_name": "DeepSeek-V4-Flash-EL", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 16384 + "context": 1000000, + "output": 384000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-05-02", "cost": { "input": 0.14, - "output": 1.4 + "output": 0.28 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "Zai GLM-4.6", - "display_name": "Zai GLM-4.6", + "id": "empiriolabs/deepseek-v4-pro-el", + "name": "DeepSeek-V4-Pro-EL", + "display_name": "DeepSeek-V4-Pro-EL", "modalities": { "input": [ "text" @@ -84271,443 +87360,486 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 384000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-05-02", "cost": { - "input": 0.44999999999999996, - "output": 1.5 + "input": 1.67, + "output": 3.33 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude-Sonnet-4.6", + "display_name": "Claude-Sonnet-4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 983040, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, "effort": "medium", "effort_options": [ - "minimal", "low", "medium", "high" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Anthropic: Claude Opus 4.1 (20250805)", - "display_name": "Anthropic: Claude Opus 4.1 (20250805)", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude-Sonnet-4.5", + "display_name": "Claude-Sonnet-4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 983040, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "OpenAI GPT-5.1 Chat", - "display_name": "OpenAI GPT-5.1 Chat", + "id": "anthropic/claude-opus-4.6", + "name": "Claude-Opus-4.6", + "display_name": "Claude-Opus-4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 983040, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-02-04", + "last_updated": "2026-02-04", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Anthropic: Claude 4.5 Haiku (20251001)", - "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", + "id": "anthropic/claude-haiku-3", + "name": "Claude-Haiku-3", + "display_name": "Claude-Haiku-3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 189096, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "release_date": "2024-03-09", + "last_updated": "2024-03-09", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.09999999999999999, - "cache_write": 1.25 + "input": 0.21, + "output": 1.1, + "cache_read": 0.021, + "cache_write": 0.26 }, "type": "chat" }, { - "id": "sonar-reasoning", - "name": "Perplexity Sonar Reasoning", - "display_name": "Perplexity Sonar Reasoning", + "id": "anthropic/claude-opus-4.1", + "name": "Claude-Opus-4.1", + "display_name": "Claude-Opus-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 196608, + "output": 32000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 5 + "input": 13, + "output": 64, + "cache_read": 1.3, + "cache_write": 16 }, "type": "chat" }, { - "id": "claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "anthropic/claude-sonnet-3.5-june", + "name": "Claude-Sonnet-3.5-June", + "display_name": "Claude-Sonnet-3.5-June", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 189096, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "release_date": "2024-11-18", + "last_updated": "2024-11-18", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "llama-prompt-guard-2-86m", - "name": "Meta Llama Prompt Guard 2 86M", - "display_name": "Meta Llama Prompt Guard 2 86M", + "id": "anthropic/claude-opus-4", + "name": "Claude-Opus-4", + "display_name": "Claude-Opus-4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 512, - "output": 2 + "context": 192512, + "output": 28672 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "cost": { - "input": 0.01, - "output": 0.01 + "input": 13, + "output": 64, + "cache_read": 1.3, + "cache_write": 16 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "OpenAI GPT-4.1 Nano", - "display_name": "OpenAI GPT-4.1 Nano", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude-Haiku-4.5", + "display_name": "Claude-Haiku-4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 192000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.09999999999999999, - "output": 0.39999999999999997, - "cache_read": 0.024999999999999998 + "input": 0.85, + "output": 4.3, + "cache_read": 0.085, + "cache_write": 1.1 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "anthropic/claude-sonnet-3.7", + "name": "Claude-Sonnet-3.7", + "display_name": "Claude-Sonnet-3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 196608, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.09999999999999999, - "output": 0.3 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "anthropic/claude-haiku-3.5", + "name": "Claude-Haiku-3.5", + "display_name": "Claude-Haiku-3.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 189096, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.7999999999999999, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.68, + "output": 3.4, + "cache_read": 0.068, + "cache_write": 0.85 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "xAI Grok 3 Mini", - "display_name": "xAI Grok 3 Mini", + "id": "anthropic/claude-opus-4.5", + "name": "Claude-Opus-4.5", + "display_name": "Claude-Opus-4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 196608, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-11-21", + "last_updated": "2025-11-21", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 }, "type": "chat" }, { - "id": "o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "anthropic/claude-sonnet-4", + "name": "Claude-Sonnet-4", + "display_name": "Claude-Sonnet-4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 983040, + "output": 64000 }, "temperature": false, "tool_call": true, @@ -84715,362 +87847,326 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "anthropic/claude-opus-4.7", + "name": "Claude-Opus-4.7", + "display_name": "Claude-Opus-4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 1048576, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "release_date": "2026-04-15", + "last_updated": "2026-04-15", "cost": { - "input": 0.27, - "output": 0.41 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.4 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "OpenAI GPT-OSS 20b", - "display_name": "OpenAI GPT-OSS 20b", + "id": "anthropic/claude-sonnet-3.5", + "name": "Claude-Sonnet-3.5", + "display_name": "Claude-Sonnet-3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 189096, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2024-06-05", + "last_updated": "2024-06-05", "cost": { - "input": 0.049999999999999996, - "output": 0.19999999999999998 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - "display_name": "OpenAI: GPT-5 Pro", + "id": "elevenlabs/elevenlabs-v3", + "name": "ElevenLabs-v3", + "display_name": "ElevenLabs-v3", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 15, - "output": 120 - }, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "type": "chat" }, { - "id": "llama-guard-4", - "name": "Meta Llama Guard 4 12B", - "display_name": "Meta Llama Guard 4 12B", + "id": "elevenlabs/elevenlabs-music", + "name": "ElevenLabs-Music", + "display_name": "ElevenLabs-Music", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 1024 + "context": 2000, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.21, - "output": 0.21 - }, + "release_date": "2025-08-29", + "last_updated": "2025-08-29", "type": "chat" }, { - "id": "gpt-4o", - "name": "OpenAI GPT-4o", - "display_name": "OpenAI GPT-4o", + "id": "elevenlabs/elevenlabs-v2.5-turbo", + "name": "ElevenLabs-v2.5-Turbo", + "display_name": "ElevenLabs-v2.5-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, + "release_date": "2024-10-28", + "last_updated": "2024-10-28", "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "novita/minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 205000, + "output": 131072 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", - "cost": { - "input": 0.3, - "output": 1.5 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-26", + "last_updated": "2025-12-26", "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Google Gemini 2.5 Flash Lite", - "display_name": "Google Gemini 2.5 Flash Lite", + "id": "novita/kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.09999999999999999, - "output": 0.39999999999999997, - "cache_read": 0.024999999999999998, - "cache_write": 0.09999999999999999 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen3-coder", - "name": "Qwen3 Coder 480B A35B Instruct Turbo", - "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", + "id": "novita/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.22, - "output": 0.95 + "input": 0.27, + "output": 0.4, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "gpt-5", - "name": "OpenAI GPT-5", - "display_name": "OpenAI GPT-5", + "id": "novita/glm-4.7-n", + "name": "glm-4.7-n", + "display_name": "glm-4.7-n", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 205000, + "output": 131072 }, "temperature": false, "tool_call": true, @@ -85078,43 +88174,16 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 - }, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "type": "chat" }, { - "id": "ernie-4.5-21b-a3b-thinking", - "name": "Baidu Ernie 4.5 21B A3B Thinking", - "display_name": "Baidu Ernie 4.5 21B A3B Thinking", + "id": "novita/glm-4.7-flash", + "name": "glm-4.7-flash", + "display_name": "glm-4.7-flash", "modalities": { "input": [ "text" @@ -85124,30 +88193,30 @@ ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 200000, + "output": 65500 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-03-16", - "last_updated": "2025-03-16", - "cost": { - "input": 0.07, - "output": 0.28 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "OpenAI GPT-OSS 120b", - "display_name": "OpenAI GPT-OSS 120b", + "id": "novita/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -85157,81 +88226,79 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", - "cost": { - "input": 0.04, - "output": 0.16 - }, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "type": "chat" }, { - "id": "gpt-5-chat-latest", - "name": "OpenAI GPT-5 Chat Latest", - "display_name": "OpenAI GPT-5 Chat Latest", + "id": "novita/kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09-30", - "last_updated": "2024-09-30", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "type": "chat" }, { - "id": "claude-4.5-sonnet", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "novita/glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 205000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -85239,23 +88306,27 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "novita/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -85265,62 +88336,82 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 205000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Meta Llama 3.1 8B Instruct", - "display_name": "Meta Llama 3.1 8B Instruct", + "id": "novita/kimi-k2.6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-20", + "last_updated": "2026-05-02", "cost": { - "input": 0.02, - "output": 0.049999999999999996 + "input": 0.96, + "output": 4.04, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "OpenAI GPT-4.1", - "display_name": "OpenAI GPT-4.1", + "id": "novita/glm-4.6v", + "name": "glm-4.6v", + "display_name": "glm-4.6v", "modalities": { "input": [ "text", @@ -85331,235 +88422,198 @@ ] }, "limit": { - "context": 1047576, + "context": 131000, "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "google/veo-3.1-fast", + "name": "Veo-3.1-Fast", + "display_name": "Veo-3.1-Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", - "cost": { - "input": 0.48, - "output": 2 - }, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "OpenAI GPT-4.1 Mini", - "display_name": "OpenAI GPT-4.1 Mini", + "id": "google/imagen-4-fast", + "name": "Imagen-4-Fast", + "display_name": "Imagen-4-Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999, - "cache_read": 0.09999999999999999 - }, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", "type": "chat" }, { - "id": "deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "google/veo-3-fast", + "name": "Veo-3-Fast", + "display_name": "Veo-3-Fast", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", - "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.21600000000000003 - }, + "release_date": "2025-10-13", + "last_updated": "2025-10-13", "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "OpenAI: GPT-5.1 Codex", - "display_name": "OpenAI: GPT-5.1 Codex", + "id": "google/nano-banana-pro", + "name": "Nano-Banana-Pro", + "display_name": "Nano-Banana-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "text", "image" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "grok-3", - "name": "xAI Grok 3", - "display_name": "xAI Grok 3", + "id": "google/gemini-3-pro", + "name": "Gemini-3-Pro", + "display_name": "Gemini-3-Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-10-22", + "last_updated": "2025-10-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 1.6, + "output": 9.6, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "xAI Grok 4 Fast Non-Reasoning", - "display_name": "xAI Grok 4 Fast Non-Reasoning", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini-3.1-Flash-Lite", + "display_name": "Gemini-3.1-Flash-Lite", "modalities": { "input": [ "text", "image", + "video", "audio" ], "output": [ @@ -85567,85 +88621,84 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 1048576, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2026-02-18", + "last_updated": "2026-02-18", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 0.25, + "output": 1.5 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Perplexity Sonar Reasoning Pro", - "display_name": "Perplexity Sonar Reasoning Pro", + "id": "google/nano-banana", + "name": "Nano-Banana", + "display_name": "Nano-Banana", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 65536, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 2, - "output": 8 + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 }, "type": "chat" - } - ] - }, - "zai-coding-plan": { - "id": "zai-coding-plan", - "name": "Z.AI Coding Plan", - "display_name": "Z.AI Coding Plan", - "api": "https://api.z.ai/api/coding/paas/v4", - "doc": "https://docs.z.ai/devpack/overview", - "models": [ + }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "google/gemini-2.5-pro", + "name": "Gemini-2.5-Pro", + "display_name": "Gemini-2.5-Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1065535, + "output": 65535 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -85654,172 +88707,222 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.87, + "output": 7, + "cache_read": 0.087 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "google/veo-3.1", + "name": "Veo-3.1", + "display_name": "Veo-3.1", "modalities": { "input": [ "text" ], "output": [ + "video" + ] + }, + "limit": { + "context": 480, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "type": "chat" + }, + { + "id": "google/imagen-3", + "name": "Imagen-3", + "display_name": "Imagen-3", + "modalities": { + "input": [ "text" + ], + "output": [ + "image" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-10-15", + "last_updated": "2024-10-15", + "type": "chat" + }, + { + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini-2.5-Flash-Lite", + "display_name": "Gemini-2.5-Flash-Lite", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1024000, + "output": 64000 + }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2025-06-19", + "last_updated": "2025-06-19", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini-2.0-Flash-Lite", + "display_name": "Gemini-2.0-Flash-Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 990000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.052, + "output": 0.21 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "google/veo-3", + "name": "Veo-3", + "display_name": "Veo-3", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "type": "chat" }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "google/gemini-3-flash", + "name": "Gemini-3-Flash", + "display_name": "Gemini-3-Flash", "modalities": { "input": [ "text", "image", "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1048576, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -85828,259 +88931,242 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "release_date": "2025-10-07", + "last_updated": "2025-10-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.4, + "output": 2.4, + "cache_read": 0.04 }, "type": "chat" - } - ] - }, - "amazon-bedrock": { - "id": "amazon-bedrock", - "name": "Amazon Bedrock", - "display_name": "Amazon Bedrock", - "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", - "models": [ + }, { - "id": "openai.gpt-oss-safeguard-120b", - "name": "GPT OSS Safeguard 120B", - "display_name": "GPT OSS Safeguard 120B", + "id": "google/gemini-deep-research", + "name": "gemini-deep-research", + "display_name": "gemini-deep-research", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.6, + "output": 9.6 }, "type": "chat" }, { - "id": "nvidia.nemotron-nano-3-30b", - "name": "NVIDIA Nemotron Nano 3 30B", - "display_name": "NVIDIA Nemotron Nano 3 30B", + "id": "google/gemini-2.5-flash", + "name": "Gemini-2.5-Flash", + "display_name": "Gemini-2.5-Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1065535, + "output": 65535 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-26", + "last_updated": "2025-04-26", "cost": { - "input": 0.06, - "output": 0.24 + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 }, "type": "chat" }, { - "id": "nvidia.nemotron-super-3-120b", - "name": "NVIDIA Nemotron 3 Super 120B A12B", - "display_name": "NVIDIA Nemotron 3 Super 120B A12B", + "id": "google/veo-2", + "name": "Veo-2", + "display_name": "Veo-2", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-03-11", - "cost": { - "input": 0.15, - "output": 0.65 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-02", + "last_updated": "2024-12-02", "type": "chat" }, { - "id": "writer.palmyra-x5-v1:0", - "name": "Palmyra X5", - "display_name": "Palmyra X5", + "id": "google/lyria", + "name": "Lyria", + "display_name": "Lyria", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 1040000, + "context": 8192, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", - "cost": { - "input": 0.6, - "output": 6 - }, + "release_date": "2025-06-04", + "last_updated": "2025-06-04", "type": "chat" }, { - "id": "mistral.ministral-3-8b-instruct", - "name": "Ministral 3 8B", - "display_name": "Ministral 3 8B", + "id": "google/imagen-4-ultra", + "name": "Imagen-4-Ultra", + "display_name": "Imagen-4-Ultra", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0.15, - "output": 0.15 - }, + "release_date": "2025-05-24", + "last_updated": "2025-05-24", "type": "chat" }, { - "id": "au.anthropic.claude-opus-4-6-v1", - "name": "AU Anthropic Claude Opus 4.6", - "display_name": "AU Anthropic Claude Opus 4.6", + "id": "google/gemini-2.0-flash", + "name": "Gemini-2.0-Flash", + "display_name": "Gemini-2.0-Flash", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 990000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 16.5, - "output": 82.5, - "cache_read": 1.65, - "cache_write": 20.625 + "input": 0.1, + "output": 0.42 }, "type": "chat" }, { - "id": "mistral.ministral-3-3b-instruct", - "name": "Ministral 3 3B", - "display_name": "Ministral 3 3B", + "id": "google/gemma-4-31b", + "name": "Gemma-4-31B", + "display_name": "Gemma-4-31B", "modalities": { "input": [ "text", @@ -86091,248 +89177,235 @@ ] }, "limit": { - "context": 256000, + "context": 262144, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "google/gemini-3.1-pro", + "name": "Gemini-3.1-Pro", + "display_name": "Gemini-3.1-Pro", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "mistral.devstral-2-123b", - "name": "Devstral 2 123B", - "display_name": "Devstral 2 123B", + "id": "google/imagen-3-fast", + "name": "Imagen-3-Fast", + "display_name": "Imagen-3-Fast", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, + "context": 480, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-17", - "last_updated": "2026-02-17", - "cost": { - "input": 0.4, - "output": 2 - }, + "attachment": true, + "open_weights": false, + "release_date": "2024-10-17", + "last_updated": "2024-10-17", "type": "chat" }, { - "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (Global)", - "display_name": "Claude Opus 4.5 (Global)", + "id": "google/imagen-4", + "name": "Imagen-4", + "display_name": "Imagen-4", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "type": "chat" }, { - "id": "mistral.voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "trytako/tako", + "name": "Tako", + "display_name": "Tako", "modalities": { "input": [ - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, + "context": 2048, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", - "cost": { - "input": 0.15, - "output": 0.35 - }, + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "type": "chat" }, { - "id": "google.gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "display_name": "Google Gemma 3 12B", + "id": "poetools/claude-code", + "name": "claude-code", + "display_name": "claude-code", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0.049999999999999996, - "output": 0.09999999999999999 - }, + "release_date": "2025-11-27", + "last_updated": "2025-11-27", "type": "chat" }, { - "id": "amazon.nova-pro-v1:0", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "fireworks-ai/kimi-k2.5-fw", + "name": "Kimi-K2.5-FW", + "display_name": "Kimi-K2.5-FW", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 262144, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -86340,114 +89413,96 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-04-11", + "last_updated": "2025-04-11", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "minimax.minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "xai/grok-4", + "name": "Grok-4", + "display_name": "Grok-4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204608, + "context": 256000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.3, - "output": 1.2 + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "global.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (Global)", - "display_name": "Claude Opus 4.7 (Global)", + "id": "xai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2025-08-22", + "last_updated": "2025-08-22", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "mistral.pixtral-large-2502-v1:0", - "name": "Pixtral Large (25.02)", - "display_name": "Pixtral Large (25.02)", + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok-4.1-Fast-Reasoning", + "display_name": "Grok-4.1-Fast-Reasoning", "modalities": { "input": [ "text", @@ -86458,28 +89513,25 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 2000000, + "output": 30000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-08", - "last_updated": "2025-04-08", - "cost": { - "input": 2, - "output": 6 - }, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": "meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct", - "display_name": "Llama 4 Maverick 17B Instruct", + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok-4.1-Fast-Non-Reasoning", + "display_name": "Grok-4.1-Fast-Non-Reasoning", "modalities": { "input": [ "text", @@ -86490,217 +89542,231 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 2000000, + "output": 30000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.24, - "output": 0.97 - }, + "open_weights": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": "us.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (US)", - "display_name": "Claude Sonnet 4.5 (US)", + "id": "xai/grok-4.20-multi-agent", + "name": "Grok-4.20-Multi-Agent", + "display_name": "Grok-4.20-Multi-Agent", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, + "input": 2, + "output": 6, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "us.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (US)", - "display_name": "Claude Haiku 4.5 (US)", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-04-11", + "last_updated": "2025-04-11", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "amazon.nova-micro-v1:0", - "name": "Nova Micro", - "display_name": "Nova Micro", + "id": "xai/grok-4-fast-non-reasoning", + "name": "Grok-4-Fast-Non-Reasoning", + "display_name": "Grok-4-Fast-Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 2000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "global.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (Global)", - "display_name": "Claude Sonnet 4.5 (Global)", + "id": "xai/grok-4-fast-reasoning", + "name": "Grok-4-Fast-Reasoning", + "display_name": "Grok-4-Fast-Reasoning", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 2000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "openai.gpt-oss-20b-1:0", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "lumalabs/ray2", + "name": "Ray2", + "display_name": "Ray2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 5000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0.07, - "output": 0.3 - }, + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "type": "chat" }, { - "id": "zai.glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "topazlabs-co/topazlabs", + "name": "TopazLabs", + "display_name": "TopazLabs", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 202752, - "output": 101376 + "context": 204, + "output": 8192 }, - "temperature": true, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "type": "chat" + }, + { + "id": "openai/gpt-5.5-pro", + "name": "GPT-5.5-Pro", + "display_name": "GPT-5.5-Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -86708,62 +89774,90 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 1, - "output": 3.2 + "input": 27.2727, + "output": 163.6364 }, "type": "chat" }, { - "id": "qwen.qwen3-32b-v1:0", - "name": "Qwen3 32B (dense)", - "display_name": "Qwen3 32B (dense)", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.15, - "output": 0.6 + "input": 4.5455, + "output": 27.2727, + "cache_read": 0.4545 }, "type": "chat" - }, + } + ] + }, + "minimax": { + "id": "minimax", + "name": "MiniMax (minimax.io)", + "display_name": "MiniMax (minimax.io)", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/guides/quickstart", + "models": [ { - "id": "deepseek.v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -86773,8 +89867,8 @@ ] }, "limit": { - "context": 163840, - "output": 81920 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -86782,34 +89876,36 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.62, - "output": 1.85 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "eu.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (EU)", - "display_name": "Claude Haiku 4.5 (EU)", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -86817,23 +89913,33 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "zai.glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -86843,7 +89949,7 @@ ] }, "limit": { - "context": 200000, + "context": 204800, "output": 131072 }, "temperature": true, @@ -86852,128 +89958,122 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.07, - "output": 0.4 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (US)", - "display_name": "Claude Opus 4.7 (US)", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "amazon.nova-2-lite-v1:0", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.33, - "output": 2.75 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -86981,23 +90081,33 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 1.2 }, "type": "chat" - }, + } + ] + }, + "groq": { + "id": "groq", + "name": "Groq", + "display_name": "Groq", + "doc": "https://console.groq.com/docs/models", + "models": [ { - "id": "qwen.qwen3-coder-480b-a35b-v1:0", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "gemma2-9b-it", + "name": "Gemma 2 9B", + "display_name": "Gemma 2 9B", "modalities": { "input": [ "text" @@ -87007,8 +90117,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -87017,54 +90127,51 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2024-06", + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 0.22, - "output": 1.8 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "amazon.nova-lite-v1:0", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": "llama-3.1-8b-instant", + "name": "Llama 3.1 8B Instant", + "display_name": "Llama 3.1 8B Instant", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 + "input": 0.05, + "output": 0.08 }, "type": "chat" }, { - "id": "meta.llama3-1-8b-instruct-v1:0", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "llama3-8b-8192", + "name": "Llama 3 8B", + "display_name": "Llama 3 8B", "modalities": { "input": [ "text" @@ -87074,8 +90181,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -87084,126 +90191,94 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2023-03", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.22, - "output": 0.22 + "input": 0.05, + "output": 0.08 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "allam-2-7b", + "name": "ALLaM-2-7b", + "display_name": "ALLaM-2-7b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-09", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google.gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "display_name": "Google Gemma 3 27B Instruct", + "id": "mistral-saba-24b", + "name": "Mistral Saba 24B", + "display_name": "Mistral Saba 24B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-27", - "last_updated": "2025-07-27", + "attachment": false, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2025-02-06", + "last_updated": "2025-02-06", "cost": { - "input": 0.12, - "output": 0.2 + "input": 0.79, + "output": 0.79 }, "type": "chat" }, { - "id": "global.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (Global)", - "display_name": "Claude Haiku 4.5 (Global)", + "id": "qwen-qwq-32b", + "name": "Qwen QwQ 32B", + "display_name": "Qwen QwQ 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -87211,35 +90286,32 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-11-27", + "last_updated": "2024-11-27", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.29, + "output": 0.39 }, "type": "chat" }, { - "id": "google.gemma-3-4b-it", - "name": "Gemma 3 4B IT", - "display_name": "Gemma 3 4B IT", + "id": "llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "display_name": "Llama 3.3 70B Versatile", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -87247,52 +90319,52 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.04, - "output": 0.08 + "input": 0.59, + "output": 0.79 }, "type": "chat" }, { - "id": "meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct", - "display_name": "Llama 4 Scout 17B Instruct", + "id": "whisper-large-v3", + "name": "Whisper Large V3", + "display_name": "Whisper Large V3", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 3500000, - "output": 16384 + "context": 448, + "output": 448 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.17, - "output": 0.66 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek.v3-v1:0", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -87302,8 +90374,8 @@ ] }, "limit": { - "context": 163840, - "output": 81920 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -87311,54 +90383,57 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, "knowledge": "2024-07", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0.75, + "output": 0.99 }, "type": "chat" }, { - "id": "mistral.magistral-small-2509", - "name": "Magistral Small 1.2", - "display_name": "Magistral Small 1.2", + "id": "llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "display_name": "Llama Guard 3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 40000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "qwen.qwen3-next-80b-a3b", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "llama3-70b-8192", + "name": "Llama 3 70B", + "display_name": "Llama 3 70B", "modalities": { "input": [ "text" @@ -87368,8 +90443,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -87377,63 +90452,52 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-03", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.59, + "output": 0.79 }, "type": "chat" }, { - "id": "zai.glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "whisper-large-v3-turbo", + "name": "Whisper Large v3 Turbo", + "display_name": "Whisper Large v3 Turbo", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 448, + "output": 448 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshot.kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "moonshotai/kimi-k2-instruct-0905", + "name": "Kimi K2 Instruct 0905", + "display_name": "Kimi K2 Instruct 0905", "modalities": { "input": [ "text" @@ -87443,72 +90507,61 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.6, - "output": 2.5 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (US)", - "display_name": "Claude Opus 4.5 (US)", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "mistral.ministral-3-14b-instruct", - "name": "Ministral 14B 3.0", - "display_name": "Ministral 14B 3.0", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -87518,28 +90571,34 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "deepseek.r1-v1:0", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "openai/gpt-oss-safeguard-20b", + "name": "Safety GPT OSS 20B", + "display_name": "Safety GPT OSS 20B", "modalities": { "input": [ "text" @@ -87549,8 +90608,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -87559,23 +90618,22 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "open_weights": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.075, + "output": 0.3, + "cache_read": 0.037 }, "type": "chat" }, { - "id": "mistral.voxtral-mini-3b-2507", - "name": "Voxtral Mini 3B 2507", - "display_name": "Voxtral Mini 3B 2507", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "audio", "text" ], "output": [ @@ -87583,28 +90641,34 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai.gpt-oss-120b-1:0", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "groq/compound", + "name": "Compound", + "display_name": "Compound", "modalities": { "input": [ "text" @@ -87614,121 +90678,127 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-09-04", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "nvidia.nemotron-nano-12b-v2", - "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", - "display_name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "id": "groq/compound-mini", + "name": "Compound Mini", + "display_name": "Compound Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-09-04", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (EU)", - "display_name": "Claude Opus 4.7 (EU)", + "id": "canopylabs/orpheus-arabic-saudi", + "name": "Orpheus Arabic Saudi", + "display_name": "Orpheus Arabic Saudi", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 4000, + "output": 50000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "attachment": false, + "open_weights": false, + "knowledge": "2025-12-16", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", + "cost": { + "input": 40, + "output": 0 }, - "attachment": true, + "type": "chat" + }, + { + "id": "canopylabs/orpheus-v1-english", + "name": "Orpheus V1 English", + "display_name": "Orpheus V1 English", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 4000, + "output": 50000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-12-19", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimax.minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "qwen/qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -87738,8 +90808,8 @@ ] }, "limit": { - "context": 196608, - "output": 98304 + "context": 131072, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -87747,20 +90817,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-11-08", + "release_date": "2024-12-23", + "last_updated": "2024-12-23", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.29, + "output": 0.59 }, "type": "chat" }, { - "id": "meta.llama3-3-70b-instruct-v1:0", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "meta-llama/llama-prompt-guard-2-22m", + "name": "Llama Prompt Guard 2 22M", + "display_name": "Llama Prompt Guard 2 22M", "modalities": { "input": [ "text" @@ -87770,40 +90852,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 512, + "output": 512 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "meta.llama3-1-70b-instruct-v1:0", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B", + "display_name": "Llama 4 Scout 17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -87812,93 +90895,84 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.11, + "output": 0.34 }, "type": "chat" }, { - "id": "eu.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (EU)", - "display_name": "Claude Sonnet 4.5 (EU)", + "id": "meta-llama/llama-prompt-guard-2-86m", + "name": "Llama Prompt Guard 2 86M", + "display_name": "Llama Prompt Guard 2 86M", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 512, + "output": 512 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (EU)", - "display_name": "Claude Opus 4.5 (EU)", + "id": "meta-llama/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17B", + "display_name": "Llama 4 Maverick 17B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "moonshotai.kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "meta-llama/llama-guard-4-12b", + "name": "Llama Guard 4 12B", + "display_name": "Llama Guard 4 12B", "modalities": { "input": [ "text", @@ -87909,98 +90983,115 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "attachment": false, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" + } + ] + }, + "xiaomi-token-plan-sgp": { + "id": "xiaomi-token-plan-sgp", + "name": "Xiaomi Token Plan (Singapore)", + "display_name": "Xiaomi Token Plan (Singapore)", + "api": "https://token-plan-sgp.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ + { + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 8192, + "output": 16384 + }, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "au.anthropic.claude-sonnet-4-6", - "name": "AU Anthropic Claude Sonnet 4.6", - "display_name": "AU Anthropic Claude Sonnet 4.6", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33, - "cache_write": 4.125 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai.gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "display_name": "GPT OSS Safeguard 20B", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -88010,28 +91101,42 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.07, - "output": 0.2 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "qwen.qwen3-coder-30b-a3b-v1:0", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -88042,28 +91147,41 @@ }, "limit": { "context": 262144, - "output": 131072 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "minimax.minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -88073,7 +91191,7 @@ ] }, "limit": { - "context": 204800, + "context": 1048576, "output": 131072 }, "temperature": true, @@ -88082,52 +91200,91 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "qwen.qwen3-vl-235b-a22b", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" - }, + } + ] + }, + "siliconflow-com": { + "id": "siliconflow-com", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.com/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ { - "id": "qwen.qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "display_name": "deepseek-ai/DeepSeek-R1", "modalities": { "input": [ "text" @@ -88137,8 +91294,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -88146,20 +91303,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.22, - "output": 1.8 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "nvidia.nemotron-nano-9b-v2", - "name": "NVIDIA Nemotron Nano 9B v2", - "display_name": "NVIDIA Nemotron Nano 9B v2", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", "modalities": { "input": [ "text" @@ -88169,60 +91337,61 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0.06, - "output": 0.23 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "mistral.mistral-large-3-675b-instruct", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "deepseek-ai/DeepSeek-V3.1", + "display_name": "deepseek-ai/DeepSeek-V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "open_weights": false, + "release_date": "2025-08-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "qwen.qwen3-235b-a22b-2507-v1:0", - "name": "Qwen3 235B A22B 2507", - "display_name": "Qwen3 235B A22B 2507", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "modalities": { "input": [ "text" @@ -88232,29 +91401,29 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "writer.palmyra-x4-v1:0", - "name": "Palmyra X4", - "display_name": "Palmyra X4", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "modalities": { "input": [ "text" @@ -88264,8 +91433,8 @@ ] }, "limit": { - "context": 122880, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -88275,31 +91444,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 10 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-1-20250805-v1:0", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -88307,23 +91474,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-10-10", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "us.deepseek.r1-v1:0", - "name": "DeepSeek-R1 (US)", - "display_name": "DeepSeek-R1 (US)", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "display_name": "deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -88333,8 +91497,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -88342,84 +91506,56 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (EU)", - "display_name": "Claude Opus 4.6 (EU)", + "id": "deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "display_name": "deepseek-ai/DeepSeek-V3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "us.meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct (US)", - "display_name": "Llama 4 Maverick 17B Instruct (US)", + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "modalities": { "input": [ "text", @@ -88430,8 +91566,8 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 4000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -88439,70 +91575,61 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "release_date": "2024-12-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.24, - "output": 0.97 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "au.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (AU)", - "display_name": "Claude Haiku 4.5 (AU)", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "moonshotai/Kimi-K2-Instruct", + "display_name": "moonshotai/Kimi-K2-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-07-13", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.58, + "output": 2.29 }, "type": "chat" }, { - "id": "jp.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (JP)", - "display_name": "Claude Sonnet 4.5 (JP)", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "display_name": "moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -88510,414 +91637,297 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.55, + "output": 2.5 }, "type": "chat" }, { - "id": "anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "moonshotai/Kimi-K2.6", + "name": "moonshotai/Kimi-K2.6", + "display_name": "moonshotai/Kimi-K2.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "jp.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (JP)", - "display_name": "Claude Sonnet 4.6 (JP)", + "id": "moonshotai/Kimi-K2.5", + "name": "moonshotai/Kimi-K2.5", + "display_name": "moonshotai/Kimi-K2.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.45, + "output": 2.25 }, "type": "chat" }, { - "id": "global.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (Global)", - "display_name": "Claude Sonnet 4.6 (Global)", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "display_name": "moonshotai/Kimi-K2-Instruct-0905", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "us.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (US)", - "display_name": "Claude Sonnet 4.6 (US)", + "id": "openai/gpt-oss-20b", + "name": "openai/gpt-oss-20b", + "display_name": "openai/gpt-oss-20b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 131000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.04, + "output": 0.18 }, "type": "chat" }, { - "id": "global.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (Global)", - "display_name": "Claude Opus 4.6 (Global)", + "id": "openai/gpt-oss-120b", + "name": "openai/gpt-oss-120b", + "display_name": "openai/gpt-oss-120b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.05, + "output": 0.45 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (US)", - "display_name": "Claude Opus 4.6 (US)", + "id": "zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "display_name": "zai-org/GLM-4.5-Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "attachment": false, + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.86 }, - "attachment": true, + "type": "chat" + }, + { + "id": "zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "display_name": "zai-org/GLM-4.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-1-20250805-v1:0", - "name": "Claude Opus 4.1 (US)", - "display_name": "Claude Opus 4.1 (US)", + "id": "zai-org/GLM-4.7", + "name": "zai-org/GLM-4.7", + "display_name": "zai-org/GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, @@ -88925,300 +91935,243 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "au.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (AU)", - "display_name": "Claude Sonnet 4.5 (AU)", + "id": "zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "display_name": "zai-org/GLM-4.5V", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "eu.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (EU)", - "display_name": "Claude Sonnet 4.6 (EU)", + "id": "zai-org/GLM-5", + "name": "zai-org/GLM-5", + "display_name": "zai-org/GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "us.meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct (US)", - "display_name": "Llama 4 Scout 17B Instruct (US)", + "id": "zai-org/GLM-5.1", + "name": "zai-org/GLM-5.1", + "display_name": "zai-org/GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 3500000, - "output": 16384 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.17, - "output": 0.66 + "input": 1.4, + "output": 4.4, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "display_name": "zai-org/GLM-4.6", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.5, + "output": 1.9 }, "type": "chat" }, { - "id": "jp.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (JP)", - "display_name": "Claude Opus 4.7 (JP)", + "id": "zai-org/GLM-5V-Turbo", + "name": "zai-org/GLM-5V-Turbo", + "display_name": "zai-org/GLM-5V-Turbo", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.2, + "output": 4, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "the-grid-ai": { - "id": "the-grid-ai", - "name": "The Grid AI", - "display_name": "The Grid AI", - "api": "https://api.thegrid.ai/v1", - "doc": "https://thegrid.ai/docs", - "models": [ + }, { - "id": "text-prime", - "name": "Text Prime", - "display_name": "Text Prime", + "id": "zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "display_name": "zai-org/GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 30000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -89226,16 +92179,20 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2025-12-07", + "last_updated": "2025-12-07", + "cost": { + "input": 0.3, + "output": 0.9 + }, "type": "chat" }, { - "id": "text-standard", - "name": "Text Standard", - "display_name": "Text Standard", + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", "modalities": { "input": [ "text" @@ -89245,25 +92202,28 @@ ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 33000, + "output": 33000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.27, + "output": 0.27 + }, "type": "chat" }, { - "id": "text-max", - "name": "Text Max", - "display_name": "Text Max", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", "modalities": { "input": [ "text" @@ -89273,8 +92233,8 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -89284,23 +92244,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-24", - "last_updated": "2026-03-24", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.57 + }, "type": "chat" - } - ] - }, - "baseten": { - "id": "baseten", - "name": "Baseten", - "display_name": "Baseten", - "api": "https://inference.baseten.co/v1", - "doc": "https://docs.baseten.co/development/model-apis/overview", - "models": [ + }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", "modalities": { "input": [ "text" @@ -89310,41 +92265,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 33000, + "output": 33000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", "modalities": { "input": [ "text" @@ -89354,8 +92296,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -89363,32 +92305,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.95, - "output": 3.15 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", "modalities": { "input": [ "text" @@ -89398,34 +92328,28 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08-31", - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "open_weights": false, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "nvidia/Nemotron-120B-A12B", - "name": "Nemotron 3 Super", - "display_name": "Nemotron 3 Super", + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", "modalities": { "input": [ "text" @@ -89435,41 +92359,28 @@ ] }, "limit": { - "context": 262144, - "output": 32678 + "context": 33000, + "output": 33000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "nex-agi/DeepSeek-V3.1-Nex-N1", + "name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", "modalities": { "input": [ "text" @@ -89479,7 +92390,7 @@ ] }, "limit": { - "context": 164000, + "context": 131000, "output": 131000 }, "temperature": true, @@ -89489,19 +92400,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-11-25", "cost": { "input": 0.5, - "output": 1.5 + "output": 2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -89511,8 +92422,8 @@ ] }, "limit": { - "context": 164000, - "output": 131000 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -89520,20 +92431,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "release_date": "2025-04-23", + "last_updated": "2025-11-25", "cost": { - "input": 0.77, - "output": 0.77 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ "text" @@ -89543,41 +92453,33 @@ ] }, "limit": { - "context": 163800, - "output": 131100 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-01", - "last_updated": "2026-03-06", + "open_weights": false, + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.45 + "input": 0.21, + "output": 0.57 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMaxAI/MiniMax-M2.1", + "display_name": "MiniMaxAI/MiniMax-M2.1", "modalities": { "input": [ "text" @@ -89587,14 +92489,13 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 197000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -89602,20 +92503,19 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMaxAI/MiniMax-M2.5", + "display_name": "MiniMaxAI/MiniMax-M2.5", "modalities": { "input": [ "text" @@ -89625,88 +92525,64 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 197000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2026-03-06", + "open_weights": false, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-02", + "last_updated": "2025-11-25", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 Instruct 0905", - "display_name": "Kimi K2 Instruct 0905", + "id": "stepfun-ai/Step-3.5-Flash", + "name": "stepfun-ai/Step-3.5-Flash", + "display_name": "stepfun-ai/Step-3.5-Flash", "modalities": { "input": [ "text" @@ -89716,40 +92592,42 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-09-05", - "last_updated": "2026-03-06", + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -89769,20 +92647,19 @@ } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-30", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 3 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -89792,8 +92669,8 @@ ] }, "limit": { - "context": 204000, - "output": 204000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -89813,31 +92690,31 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -89856,84 +92733,62 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.15 + "input": 0.45, + "output": 3.5 }, "type": "chat" - } - ] - }, - "frogbot": { - "id": "frogbot", - "name": "FrogBot", - "display_name": "FrogBot", - "api": "https://app.frogbot.ai/api/v1", - "doc": "https://docs.frogbot.ai", - "models": [ + }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-25", + "release_date": "2025-09-18", "last_updated": "2025-11-25", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -89943,44 +92798,45 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-09-25", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -89995,200 +92851,122 @@ }, "attachment": false, "open_weights": false, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2025-07-30", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2025-08-01", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "zai-glm-5-1", - "name": "Z.AI GLM-5.1", - "display_name": "Z.AI GLM-5.1", + "id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "display_name": "Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ "text" @@ -90198,87 +92976,61 @@ ] }, "limit": { - "context": 198000, - "output": 8192 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-20", - "last_updated": "2025-02-22", + "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", @@ -90289,8 +93041,8 @@ ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 131000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -90299,20 +93051,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-25", + "release_date": "2025-01-28", "last_updated": "2025-11-25", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "gpt-5-4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ "text", @@ -90323,164 +93073,103 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-07-17", - "last_updated": "2025-07-17", + "release_date": "2025-07-23", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075 + "input": 0.09, + "output": 0.6 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "gpt-5-5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -90489,76 +93178,60 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2025-03-06", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.15, + "output": 0.58 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "display_name": "Qwen/Qwen3-VL-32B-Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "gpt-5-4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", "modalities": { "input": [ "text", @@ -90569,160 +93242,72 @@ ] }, "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", - "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 - }, - "type": "chat" - }, - { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 128000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2025-10-11", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek v4 Pro", - "display_name": "DeepSeek v4 Pro", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-03-24", + "last_updated": "2025-11-25", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.14 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "modalities": { "input": [ "text" @@ -90732,69 +93317,60 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 131000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.07, - "output": 0.2 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "qwen-3-6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "display_name": "Qwen/Qwen3-VL-8B-Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-03", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.1 + "input": 0.18, + "output": 0.68 }, "type": "chat" }, { - "id": "minimax-m2-7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ "text" @@ -90804,41 +93380,40 @@ ] }, "limit": { - "context": 192000, - "output": 8192 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "minimax-m2-5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Qwen/Qwen2.5-VL-7B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 192000, - "output": 8192 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -90847,54 +93422,60 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-01-15", - "last_updated": "2025-02-22", + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -90904,185 +93485,145 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "open_weights": false, + "release_date": "2024-11-11", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "gemini-3-1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-02-18", - "last_updated": "2026-02-18", + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "kimi-k2-6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "display_name": "Qwen/Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.35, + "output": 1.42 }, "type": "chat" }, { - "id": "gpt-5-3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.25, + "output": 1 }, "type": "chat" - } - ] - }, - "zhipuai-coding-plan": { - "id": "zhipuai-coding-plan", - "name": "Zhipu AI Coding Plan", - "display_name": "Zhipu AI Coding Plan", - "api": "https://open.bigmodel.cn/api/coding/paas/v4", - "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", - "models": [ + }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "display_name": "Qwen/Qwen3-VL-8B-Thinking", "modalities": { "input": [ "text", - "image", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -91103,20 +93644,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.18, + "output": 2 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", "modalities": { "input": [ "text" @@ -91126,8 +93665,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -91148,20 +93687,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ "text" @@ -91171,42 +93708,28 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "release_date": "2024-09-19", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ "text" @@ -91216,43 +93739,40 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "display_name": "Qwen/Qwen3-VL-32B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -91271,32 +93791,57 @@ ] } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "cost": { + "input": 0.2, + "output": 1.5 + }, + "type": "chat" + }, + { + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.14, + "output": 0.57 }, "type": "chat" - } - ] - }, - "alibaba-coding-plan": { - "id": "alibaba-coding-plan", - "name": "Alibaba Coding Plan", - "display_name": "Alibaba Coding Plan", - "api": "https://coding-intl.dashscope.aliyuncs.com/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/coding-plan", - "models": [ + }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", "modalities": { "input": [ "text" @@ -91306,8 +93851,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -91315,70 +93860,50 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "deepseek-ai/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -91388,8 +93913,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -91410,21 +93935,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "deepseek-ai/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -91434,8 +93958,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -91455,32 +93979,44 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "google-vertex": { + "id": "google-vertex", + "name": "Vertex", + "display_name": "Vertex", + "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", + "models": [ { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 24576 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -91488,45 +94024,37 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09-25", + "display_name": "Gemini 2.5 Flash Preview 09-25", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -91538,121 +94066,182 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "display_name": "Gemini 2.5 Flash Lite Preview 06-17", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 65536, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -91664,51 +94253,55 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 }, "type": "chat" - } - ] - }, - "venice": { - "id": "venice", - "name": "Venice AI", - "display_name": "Venice AI", - "doc": "https://docs.venice.ai", - "models": [ + }, { - "id": "openai-gpt-4o-mini-2024-07-18", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -91717,90 +94310,87 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-03-06", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.1875, - "output": 0.75, - "cache_read": 0.09375 + "input": 0.15, + "output": 0.6, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen3-next-80b", - "name": "Qwen 3 Next 80b", - "display_name": "Qwen 3 Next 80b", + "id": "deepseek-ai/deepseek-v3.1-maas", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 163840, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.35, - "output": 1.9 + "input": 0.6, + "output": 1.7 }, "type": "chat" }, { - "id": "grok-4-20-multi-agent", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "deepseek-ai/deepseek-v3.2-maas", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-05-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-17", + "last_updated": "2026-04-04", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 0.56, + "output": 1.68, + "cache_read": 0.056 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen 3 235B A22B Instruct 2507", - "display_name": "Qwen 3 235B A22B Instruct 2507", + "id": "moonshotai/kimi-k2-thinking-maas", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -91810,40 +94400,51 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "knowledge": "2024-08", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.15, - "output": 0.75 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "z-ai-glm-5v-turbo", - "name": "GLM 5V Turbo", - "display_name": "GLM 5V Turbo", + "id": "openai/gpt-oss-20b-maas", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 131072, "output": 32768 }, "temperature": true, @@ -91852,65 +94453,63 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-12", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.5, - "output": 5, - "cache_read": 0.3 + "input": 0.07, + "output": 0.25 }, "type": "chat" }, { - "id": "gemma-4-uncensored", - "name": "Gemma 4 Uncensored", - "display_name": "Gemma 4 Uncensored", + "id": "openai/gpt-oss-120b-maas", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-13", - "last_updated": "2026-04-19", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.1625, - "output": 0.5 + "input": 0.09, + "output": 0.36 }, "type": "chat" }, { - "id": "grok-41-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "zai-org/glm-5-maas", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -91918,84 +94517,77 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-12-01", - "last_updated": "2026-04-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.23, - "output": 0.57, - "cache_read": 0.06 + "input": 1, + "output": 3.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "zai-org/glm-4.7-maas", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-06", + "last_updated": "2026-01-06", "cost": { - "input": 3.6, - "output": 18, - "cache_read": 0.36, - "cache_write": 4.5 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "nvidia-nemotron-cascade-2-30b-a3b", - "name": "Nemotron Cascade 2 30B A3B", - "display_name": "Nemotron Cascade 2 30B A3B", + "id": "qwen/qwen3-235b-a22b-instruct-2507-maas", + "name": "Qwen3 235B A22B Instruct", + "display_name": "Qwen3 235B A22B Instruct", "modalities": { "input": [ "text" @@ -92005,8 +94597,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -92016,76 +94608,50 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-24", - "last_updated": "2026-04-09", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": { - "input": 0.14, - "output": 0.8 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "meta/llama-3.3-70b-instruct-maas", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-19", - "last_updated": "2026-03-12", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.7, - "output": 3.75, - "cache_read": 0.07 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "grok-4-20", - "name": "Grok 4.20", - "display_name": "Grok 4.20", + "id": "meta/llama-4-maverick-17b-128e-instruct-maas", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ "text", @@ -92096,48 +94662,44 @@ ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 524288, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-05-07", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 0.35, + "output": 1.15 }, "type": "chat" }, { - "id": "google-gemma-4-26b-a4b-it", - "name": "Google Gemma 4 26B A4B Instruct", - "display_name": "Google Gemma 4 26B A4B Instruct", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92145,124 +94707,116 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-12", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0.1625, - "output": 0.5 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 - }, - "type": "chat" - }, - { - "id": "qwen3-coder-480b-a35b-instruct-turbo", - "name": "Qwen 3 Coder 480B Turbo", - "display_name": "Qwen 3 Coder 480B Turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } ] }, - "limit": { - "context": 256000, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-02-26", - "cost": { - "input": 0.35, - "output": 1.5, - "cache_read": 0.04 - }, "type": "chat" }, { - "id": "qwen3-5-397b-a17b", - "name": "Qwen 3.5 397B", - "display_name": "Qwen 3.5 397B", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "display_name": "Gemini 2.5 Flash Preview 04-17", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92270,31 +94824,57 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-04-16", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 0.75, - "output": 4.5 + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "zai-org-glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "display_name": "Gemini 2.5 Flash Preview 05-20", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92305,42 +94885,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-24", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.55, - "output": 2.65, - "cache_read": 0.11 + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "openai-gpt-54", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "display_name": "Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92348,32 +94940,56 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-09", + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 3.13, - "output": 18.8, - "cache_read": 0.313 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "zai-org-glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "display_name": "Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92381,106 +94997,171 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-03-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", "cost": { - "input": 0.125, - "output": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "nvidia-nemotron-3-nano-30b-a3b", - "name": "NVIDIA Nemotron 3 Nano 30B", - "display_name": "NVIDIA Nemotron 3 Nano 30B", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3 VL 235B", - "display_name": "Qwen3 VL 235B", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-01-16", - "last_updated": "2026-03-12", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.25, - "output": 1.5 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "openai-gpt-53-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92490,30 +95171,34 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-12", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "venice-uncensored-1-2", - "name": "Venice Uncensored 1.2", - "display_name": "Venice Uncensored 1.2", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1048576, "output": 8192 }, "temperature": true, @@ -92522,29 +95207,34 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-19", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.2, - "output": 0.9 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "openai-gpt-52", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -92553,64 +95243,70 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-13", - "last_updated": "2026-03-12", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 - }, - "type": "chat" - }, - { - "id": "mistral-small-3-2-24b-instruct", - "name": "Mistral Small 3.2 24B Instruct", - "display_name": "Mistral Small 3.2 24B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } ] }, - "limit": { - "context": 256000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-15", - "last_updated": "2026-03-16", - "cost": { - "input": 0.09375, - "output": 0.25 - }, "type": "chat" }, { - "id": "minimax-m27", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92618,32 +95314,43 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-04-12", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.375, + "input": 0.25, "output": 1.5, - "cache_read": 0.075 + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen 3 235B A22B Thinking 2507", - "display_name": "Qwen 3 235B A22B Thinking 2507", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92654,41 +95361,66 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.45, - "output": 3.5 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen3-5-35b-a3b", - "name": "Qwen 3.5 35B A3B", - "display_name": "Qwen 3.5 35B A3B", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -92697,21 +95429,42 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-25", - "last_updated": "2026-04-16", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.3125, - "output": 1.25, - "cache_read": 0.15625 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -92721,63 +95474,70 @@ ] }, "limit": { - "context": 128000, - "output": 50000 + "context": 2048, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-20", - "last_updated": "2026-04-09", + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.3125, - "output": 0.9375, - "cache_read": 0.03125 + "input": 0.15, + "output": 0 }, - "type": "chat" - }, + "type": "embedding" + } + ] + }, + "databricks": { + "id": "databricks", + "name": "Databricks", + "display_name": "Databricks", + "api": "https://${DATABRICKS_HOST}/ai-gateway/mlflow/v1", + "doc": "https://docs.databricks.com/aws/en/machine-learning/foundation-models/", + "models": [ { - "id": "google-gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "display_name": "Google Gemma 3 27B Instruct", + "id": "databricks-gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-04", - "last_updated": "2026-03-12", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.12, + "input": 0.05, "output": 0.2 }, "type": "chat" }, { - "id": "olafangensan-glm-4.7-flash-heretic", - "name": "GLM 4.7 Flash Heretic", - "display_name": "GLM 4.7 Flash Heretic", + "id": "databricks-gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -92787,8 +95547,8 @@ ] }, "limit": { - "context": 200000, - "output": 24000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -92798,22 +95558,25 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-04", - "last_updated": "2026-03-12", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.14, - "output": 0.8 + "input": 0.072, + "output": 0.28 }, "type": "chat" }, { - "id": "openai-gpt-55-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "databricks-gemini-3-pro", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" @@ -92821,7 +95584,7 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -92831,30 +95594,49 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-25", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 37.5, - "output": 225 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "openai-gpt-52-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "databricks-claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -92864,63 +95646,36 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-01-15", - "last_updated": "2026-03-12", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "venice-uncensored-role-play", - "name": "Venice Role Play Uncensored", - "display_name": "Venice Role Play Uncensored", + "id": "databricks-gemini-3-1-flash-lite", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-20", - "last_updated": "2026-03-16", - "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" - }, - { - "id": "zai-org-glm-5", - "name": "GLM 5", - "display_name": "GLM 5", - "modalities": { - "input": [ - "text" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -92928,87 +95683,98 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "zai-org-glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "databricks-claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-01", - "last_updated": "2026-04-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.85, - "output": 2.75, - "cache_read": 0.3 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "databricks-claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 32000 }, "temperature": true, @@ -93019,24 +95785,21 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-18", - "last_updated": "2026-05-04", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "mistral-small-2603", - "name": "Mistral Small 4", - "display_name": "Mistral Small 4", + "id": "databricks-gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -93047,74 +95810,46 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-04-09", - "cost": { - "input": 0.1875, - "output": 0.75 - }, - "type": "chat" - }, - { - "id": "openai-gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-06", - "last_updated": "2026-05-06", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.07, - "output": 0.3 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "databricks-gemini-3-flash", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -93122,27 +95857,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-12-06", - "last_updated": "2026-04-12", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "qwen3-5-9b", - "name": "Qwen 3.5 9B", - "display_name": "Qwen 3.5 9B", + "id": "databricks-gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -93153,32 +95884,36 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-05", - "last_updated": "2026-04-19", + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.1, - "output": 0.15 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "databricks-claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -93186,52 +95921,70 @@ }, "limit": { "context": 1000000, - "output": 32768 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.17, - "output": 0.35, - "cache_read": 0.028 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai-gpt-54-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "databricks-claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -93241,22 +95994,21 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-09", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 37.5, - "output": 225, - "context_over_200k": { - "input": 75, - "output": 337.5 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai-gpt-54-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "databricks-gpt-5-4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", @@ -93270,7 +96022,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -93278,121 +96030,131 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-31", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.9375, - "output": 5.625, - "cache_read": 0.09375 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "minimax-m25", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "databricks-gpt-5-2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-04-12", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.34, - "output": 1.19, - "cache_read": 0.04 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "zai-org-glm-5-1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "databricks-claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 24000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-08", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.75, - "output": 5.5, - "cache_read": 0.325 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai-gpt-55", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "databricks-gpt-5-4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -93400,37 +96162,49 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 6.25, - "output": 37.5, - "cache_read": 0.625, + "input": 2.5, + "output": 15, + "cache_read": 0.25, "context_over_200k": { - "input": 12.5, - "output": 56.25, - "cache_read": 1.25 - } + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "qwen3-6-27b", - "name": "Qwen 3.6 27B", - "display_name": "Qwen 3.6 27B", + "id": "databricks-claude-sonnet-4", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -93440,18 +96214,21 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.325, - "output": 3.25 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "databricks-gpt-5-4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -93462,113 +96239,98 @@ ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-16", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "databricks-gpt-5-5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.73, - "output": 3.796, - "cache_read": 0.33 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "databricks-gemini-2-5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -93576,39 +96338,52 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-04", - "last_updated": "2026-03-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.33, - "output": 0.48, - "cache_read": 0.16 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + }, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "qwen-3-6-plus", - "name": "Qwen 3.6 Plus Uncensored", - "display_name": "Qwen 3.6 Plus Uncensored", + "id": "databricks-gemini-2-5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -93619,71 +96394,108 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-12", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.625, - "output": 3.75, - "cache_read": 0.0625, - "cache_write": 0.78, - "context_over_200k": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.0625, - "cache_write": 0.78 - } + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "aion-labs-aion-2-0", - "name": "Aion 2.0", - "display_name": "Aion 2.0", + "id": "databricks-gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, + "type": "chat" + }, + { + "id": "databricks-claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-24", - "last_updated": "2026-04-12", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { "input": 1, - "output": 2, - "cache_read": 0.25 + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "databricks-gemini-3-1-pro", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -93691,27 +96503,38 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-01-15", - "last_updated": "2026-04-12", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 3.75, - "output": 18.75, - "cache_read": 0.375, - "cache_write": 4.69 + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + }, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ] }, "type": "chat" }, { - "id": "openai-gpt-4o-2024-11-20", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "databricks-gpt-5-1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -93722,28 +96545,40 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-03-06", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 3.125, - "output": 12.5 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" - }, + } + ] + }, + "berget": { + "id": "berget", + "name": "Berget.AI", + "display_name": "Berget.AI", + "api": "https://api.berget.ai/v1", + "doc": "https://api.berget.ai", + "models": [ { - "id": "llama-3.3-70b", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ "text" @@ -93754,40 +96589,45 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-06", - "last_updated": "2026-03-12", + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.7, - "output": 2.8 + "input": 0.44, + "output": 0.99 }, "type": "chat" }, { - "id": "kimi-k2-5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -93806,24 +96646,24 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2026-01-27", - "last_updated": "2026-04-30", + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.56, - "output": 3.5, - "cache_read": 0.22 + "input": 0.77, + "output": 2.75 }, "type": "chat" }, { - "id": "llama-3.2-3b", - "name": "Llama 3.2 3B", - "display_name": "Llama 3.2 3B", + "id": "mistralai/Mistral-Medium-3.5-128B", + "name": "Mistral Medium 3.5 128B", + "display_name": "Mistral Medium 3.5 128B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93831,29 +96671,30 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-10-03", - "last_updated": "2026-03-12", + "knowledge": "2026-04", + "release_date": "2026-04-29", + "last_updated": "2026-04-29", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.65, + "output": 5.5 }, "type": "chat" }, { - "id": "arcee-trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24B Instruct 2506", + "display_name": "Mistral Small 3.2 24B Instruct 2506", "modalities": { "input": [ "text" @@ -93863,8 +96704,8 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -93872,35 +96713,27 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-04", + "knowledge": "2025-09", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.3125, - "output": 1.125, - "cache_read": 0.075 + "input": 0.33, + "output": 0.33 }, "type": "chat" }, { - "id": "hermes-3-llama-3.1-405b", - "name": "Hermes 3 Llama 3.1 405b", - "display_name": "Hermes 3 Llama 3.1 405b", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B Instruct", + "display_name": "Gemma 4 31B Instruct", "modalities": { "input": [ - "text" + "audio", + "image", + "text", + "video" ], "output": [ "text" @@ -93908,42 +96741,40 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-25", - "last_updated": "2026-03-12", + "knowledge": "2025-12", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 1.1, - "output": 3 + "input": 0.275, + "output": 0.55 }, "type": "chat" }, { - "id": "gemini-3-1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -93951,39 +96782,34 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-03-12", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.5, - "cache_write": 0.5, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.99, + "output": 0.99 }, "type": "chat" }, { - "id": "kimi-k2-6", + "id": "moonshotai/Kimi-K2.6", "name": "Kimi K2.6", "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -94004,81 +96830,109 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-30", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0.85, - "output": 4.655, - "cache_read": 0.22 + "input": 0.83, + "output": 3.85, + "cache_read": 0.16 + }, + "type": "chat" + } + ] + }, + "moonshot": { + "id": "moonshot", + "name": "Moonshot AI (China)", + "display_name": "Moonshot AI (China)", + "api": "https://api.moonshot.cn/v1", + "doc": "https://platform.moonshot.cn/docs/api/chat", + "models": [ + { + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 2.4, + "output": 10, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "claude-opus-4-6-fast", - "name": "Claude Opus 4.6 Fast", - "display_name": "Claude Opus 4.6 Fast", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 36, - "output": 180, - "cache_read": 3.6, - "cache_write": 45 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "z-ai-glm-5-turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -94088,8 +96942,8 @@ ] }, "limit": { - "context": 200000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -94097,63 +96951,66 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-03-15", - "last_updated": "2026-04-12", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 1.15, + "output": 8, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "google-gemma-4-31b-it", - "name": "Google Gemma 4 31B Instruct", - "display_name": "Google Gemma 4 31B Instruct", + "id": "kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-03", - "last_updated": "2026-04-12", + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.175, - "output": 0.5 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" - } - ] - }, - "cerebras": { - "id": "cerebras", - "name": "Cerebras", - "display_name": "Cerebras", - "doc": "https://inference-docs.cerebras.ai/models/overview", - "models": [ + }, { - "id": "llama3.1-8b", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -94163,29 +97020,42 @@ ] }, "limit": { - "context": 32000, - "output": 8000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "qwen-3-235b-a22b-instruct-2507", - "name": "Qwen 3 235B Instruct", - "display_name": "Qwen 3 235B Instruct", + "id": "kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -94195,8 +97065,8 @@ ] }, "limit": { - "context": 131000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -94205,62 +97075,87 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { "input": 0.6, - "output": 1.2 + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "zai-glm-4.7", - "name": "Z.AI GLM-4.7", - "display_name": "Z.AI GLM-4.7", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 40000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2026-01-10", - "last_updated": "2026-01-10", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 2.25, - "output": 2.75, - "cache_read": 0, - "cache_write": 0 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" - }, + } + ] + }, + "alibaba-coding-plan-cn": { + "id": "alibaba-coding-plan-cn", + "name": "Alibaba Coding Plan (China)", + "display_name": "Alibaba Coding Plan (China)", + "api": "https://coding.dashscope.aliyuncs.com/v1", + "doc": "https://help.aliyun.com/zh/model-studio/coding-plan", + "models": [ { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 262144, "output": 32768 }, "temperature": true, @@ -94271,43 +97166,44 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.25, - "output": 0.69 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "lmstudio": { - "id": "lmstudio", - "name": "LMStudio", - "display_name": "LMStudio", - "api": "http://127.0.0.1:1234/v1", - "doc": "https://lmstudio.ai/models", - "models": [ + }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -94317,23 +97213,32 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b", - "name": "Qwen3 Coder 30B", - "display_name": "Qwen3 Coder 30B", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -94353,60 +97258,68 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-2507", - "name": "Qwen3 30B A3B 2507", - "display_name": "Qwen3 30B A3B 2507", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "lucidquery": { - "id": "lucidquery", - "name": "LucidQuery AI", - "display_name": "LucidQuery AI", - "api": "https://lucidquery.com/api/v1", - "doc": "https://lucidquery.com/api/docs", - "models": [ + }, { - "id": "lucidnova-rf1-100b", - "name": "LucidNova RF1 100B", - "display_name": "LucidNova RF1 100B", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -94416,30 +97329,42 @@ ] }, "limit": { - "context": 120000, - "output": 8000 + "context": 196608, + "output": 24576 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-16", - "release_date": "2024-12-28", - "last_updated": "2025-09-10", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2, - "output": 5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "lucidquery-nexus-coder", - "name": "LucidQuery Nexus Coder", - "display_name": "LucidQuery Nexus Coder", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -94449,39 +97374,42 @@ ] }, "limit": { - "context": 250000, - "output": 60000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "knowledge": "2025-04", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 2, - "output": 5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "moonshot": { - "id": "moonshot", - "name": "Moonshot AI (China)", - "display_name": "Moonshot AI (China)", - "api": "https://api.moonshot.cn/v1", - "doc": "https://platform.moonshot.cn/docs/api/chat", - "models": [ + }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -94491,8 +97419,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -94513,20 +97441,21 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "kimi-k2-0711-preview", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -94536,30 +97465,42 @@ ] }, "limit": { - "context": 131072, + "context": 202752, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -94569,8 +97510,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -94579,33 +97520,41 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 2.4, - "output": 10, - "cache_read": 0.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "minimax-cn": { + "id": "minimax-cn", + "name": "MiniMax (minimaxi.com)", + "display_name": "MiniMax (minimaxi.com)", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/guides/quickstart", + "models": [ { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -94615,31 +97564,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -94649,8 +97590,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -94671,35 +97612,72 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -94718,20 +97696,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0.6, - "output": 3, - "cache_read": 0.1 + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "kimi-k2-0905-preview", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" @@ -94741,51 +97719,93 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.3, + "output": 1.2 }, "type": "chat" } ] }, - "azure-cognitive-services": { - "id": "azure-cognitive-services", - "name": "Azure Cognitive Services", - "display_name": "Azure Cognitive Services", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "chutes": { + "id": "chutes", + "name": "Chutes", + "display_name": "Chutes", + "api": "https://llm.chutes.ai/v1", + "doc": "https://llm.chutes.ai/v1/models", "models": [ { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "deepseek-ai/DeepSeek-R1-0528-TEE", + "name": "DeepSeek R1 0528 TEE", + "display_name": "DeepSeek R1 0528 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -94795,39 +97815,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.45, + "output": 2.15, + "cache_read": 0.225 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "deepseek-ai/DeepSeek-V3.1-TEE", + "name": "DeepSeek V3.1 TEE", + "display_name": "DeepSeek V3.1 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -94837,39 +97859,73 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "deepseek-ai/DeepSeek-V3-0324-TEE", + "name": "DeepSeek V3 0324 TEE", + "display_name": "DeepSeek V3 0324 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163840, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.25, + "output": 1, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -94879,38 +97935,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.0272, + "output": 0.1087, + "cache_read": 0.0136 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "deepseek-ai/DeepSeek-V3.2-TEE", + "name": "DeepSeek V3.2 TEE", + "display_name": "DeepSeek V3.2 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -94921,106 +97980,89 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.95, - "output": 4 + "input": 0.28, + "output": 0.42, + "cache_read": 0.14 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "moonshotai/Kimi-K2.5-TEE", + "name": "Kimi K2.5 TEE", + "display_name": "Kimi K2.5 TEE", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 262144, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-04-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 0.44, + "output": 2, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "moonshotai/Kimi-K2.6-TEE", + "name": "Kimi K2.6 TEE", + "display_name": "Kimi K2.6 TEE", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -95030,26 +98072,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-04-20", + "last_updated": "2026-04-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.95, + "output": 4, + "cache_read": 0.475 }, "type": "chat" }, { - "id": "mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "openai/gpt-oss-120b-TEE", + "name": "gpt oss 120b TEE", + "display_name": "gpt oss 120b TEE", "modalities": { "input": [ "text" @@ -95059,63 +98106,85 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.09, + "output": 0.36, + "cache_read": 0.045 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "zai-org/GLM-5-TEE", + "name": "GLM 5 TEE", + "display_name": "GLM 5 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2026-02-14", + "last_updated": "2026-04-25", "cost": { - "input": 0.25, - "output": 1 + "input": 0.95, + "output": 2.55, + "cache_read": 0.475 }, "type": "chat" }, { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "zai-org/GLM-4.7-TEE", + "name": "GLM 4.7 TEE", + "display_name": "GLM 4.7 TEE", "modalities": { "input": [ "text" @@ -95125,88 +98194,118 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.39, + "output": 1.75, + "cache_read": 0.195 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "zai-org/GLM-4.7-FP8", + "name": "GLM 4.7 FP8", + "display_name": "GLM 4.7 FP8", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-04-25", + "cost": { + "input": 0.2989, + "output": 1.1957, + "cache_read": 0.14945 + }, + "type": "chat" + }, + { + "id": "zai-org/GLM-5.1-TEE", + "name": "GLM 5.1 TEE", + "display_name": "GLM 5.1 TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 202752, + "output": 65535 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-04-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.05, + "output": 3.5, + "cache_read": 0.525 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "zai-org/GLM-5-Turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ "text" @@ -95216,8 +98315,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -95238,31 +98337,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", + "release_date": "2026-03-11", + "last_updated": "2026-04-25", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.4891, + "output": 1.9565, + "cache_read": 0.24455 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "zai-org/GLM-4.6V", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -95281,21 +98380,86 @@ ] } }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.3, + "output": 0.9, + "cache_read": 0.15 + }, + "type": "chat" + }, + { + "id": "unsloth/gemma-3-27b-it", + "name": "gemma 3 27b it", + "display_name": "gemma 3 27b it", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.0272, + "output": 0.1087, + "cache_read": 0.0136 + }, + "type": "chat" + }, + { + "id": "unsloth/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.02, + "output": 0.04, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "unsloth/Llama-3.2-3B-Instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -95305,8 +98469,8 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": false, @@ -95314,20 +98478,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "open_weights": true, + "release_date": "2025-02-12", + "last_updated": "2026-04-25", "cost": { - "input": 1.5, - "output": 2 + "input": 0.01, + "output": 0.0136, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "unsloth/gemma-3-12b-it", + "name": "gemma 3 12b it", + "display_name": "gemma 3 12b it", "modalities": { "input": [ "text", @@ -95338,29 +98502,29 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.4, - "output": 2 + "input": 0.03, + "output": 0.1, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", + "id": "unsloth/Llama-3.2-1B-Instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -95370,61 +98534,106 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 16384, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2026-01-27", + "last_updated": "2026-04-25", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.01, + "output": 0.0109, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", + "id": "unsloth/gemma-3-4b-it", + "name": "gemma 3 4b it", + "display_name": "gemma 3 4b it", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 512, - "output": 1024 + "context": 96000, + "output": 96000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.01, + "output": 0.0272, + "cache_read": 0.005 + }, + "type": "chat" + }, + { + "id": "NousResearch/Hermes-4-14B", + "name": "Hermes 4 14B", + "display_name": "Hermes 4 14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40960, + "output": 40960 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.1, - "output": 0 + "input": 0.0136, + "output": 0.0543, + "cache_read": 0.0068 }, "type": "chat" }, { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", + "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", + "name": "DeepHermes 3 Mistral 24B Preview", + "display_name": "DeepHermes 3 Mistral 24B Preview", "modalities": { "input": [ "text" @@ -95443,20 +98652,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 60, - "output": 120 + "input": 0.0245, + "output": 0.0978, + "cache_read": 0.01225 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "rednote-hilab/dots.ocr", + "name": "dots.ocr", + "display_name": "dots.ocr", "modalities": { "input": [ "text", @@ -95467,10 +98676,108 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.01, + "output": 0.0109, + "cache_read": 0.005 + }, + "type": "chat" + }, + { + "id": "google/gemma-4-31B-turbo-TEE", + "name": "gemma 4 31B turbo TEE", + "display_name": "gemma 4 31B turbo TEE", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", + "cost": { + "input": 0.13, + "output": 0.38, + "cache_read": 0.065 + }, + "type": "chat" + }, + { + "id": "XiaomiMiMo/MiMo-V2-Flash-TEE", + "name": "MiMo V2 Flash TEE", + "display_name": "MiMo V2 Flash TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", + "cost": { + "input": 0.09, + "output": 0.29, + "cache_read": 0.045 + }, + "type": "chat" + }, + { + "id": "MiniMaxAI/MiniMax-M2.5-TEE", + "name": "MiniMax M2.5 TEE", + "display_name": "MiniMax M2.5 TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 65536 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -95479,238 +98786,4855 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-04-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.15, + "output": 1.2, + "cache_read": 0.075 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.5-397B-A17B-TEE", + "name": "Qwen3.5 397B A17B TEE", + "display_name": "Qwen3.5 397B A17B TEE", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-18", + "last_updated": "2026-04-25", + "cost": { + "input": 0.39, + "output": 2.34, + "cache_read": 0.195 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.11, + "output": 0.6, + "cache_read": 0.055 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.1, + "output": 0.8, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", + "name": "Qwen3 235B A22B Instruct 2507 TEE", + "display_name": "Qwen3 235B A22B Instruct 2507 TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.1, + "output": 0.6, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3Guard-Gen-0.6B", + "name": "Qwen3Guard Gen 0.6B", + "display_name": "Qwen3Guard Gen 0.6B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.01, + "output": 0.0109, + "cache_read": 0.005 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40960, + "output": 40960 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.06, + "output": 0.22, + "cache_read": 0.03 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.0543, + "output": 0.2174, + "cache_read": 0.02715 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-32B-TEE", + "name": "Qwen3 32B TEE", + "display_name": "Qwen3 32B TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40960, + "output": 40960 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", + "cost": { + "input": 0.08, + "output": 0.24, + "cache_read": 0.04 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Coder-Next-TEE", + "name": "Qwen3 Coder Next TEE", + "display_name": "Qwen3 Coder Next TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", + "cost": { + "input": 0.12, + "output": 0.75, + "cache_read": 0.06 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.0272, + "output": 0.1087, + "cache_read": 0.0136 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.6-27B-TEE", + "name": "Qwen3.6 27B TEE", + "display_name": "Qwen3.6 27B TEE", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", + "cost": { + "input": 0.195, + "output": 1.56, + "cache_read": 0.0975 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.2989, + "output": 1.1957, + "cache_read": 0.14945 + }, + "type": "chat" + }, + { + "id": "tngtech/DeepSeek-TNG-R1T2-Chimera-TEE", + "name": "DeepSeek TNG R1T2 Chimera TEE", + "display_name": "DeepSeek TNG R1T2 Chimera TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 163840 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", + "cost": { + "input": 0.3, + "output": 1.1, + "cache_read": 0.15 + }, + "type": "chat" + } + ] + }, + "siliconflow": { + "id": "siliconflow", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.cn/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ + { + "id": "Pro/deepseek-ai/DeepSeek-R1", + "name": "Pro/deepseek-ai/DeepSeek-R1", + "display_name": "Pro/deepseek-ai/DeepSeek-R1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-11-25", + "cost": { + "input": 0.5, + "output": 2.18 + }, + "type": "chat" + }, + { + "id": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", + "cost": { + "input": 0.27, + "output": 1 + }, + "type": "chat" + }, + { + "id": "Pro/deepseek-ai/DeepSeek-V3.2", + "name": "Pro/deepseek-ai/DeepSeek-V3.2", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 164000, + "output": 164000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", + "cost": { + "input": 0.27, + "output": 0.42 + }, + "type": "chat" + }, + { + "id": "Pro/deepseek-ai/DeepSeek-V3", + "name": "Pro/deepseek-ai/DeepSeek-V3", + "display_name": "Pro/deepseek-ai/DeepSeek-V3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", + "cost": { + "input": 0.25, + "output": 1 + }, + "type": "chat" + }, + { + "id": "Pro/moonshotai/Kimi-K2-Thinking", + "name": "Pro/moonshotai/Kimi-K2-Thinking", + "display_name": "Pro/moonshotai/Kimi-K2-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-25", + "cost": { + "input": 0.55, + "output": 2.5 + }, + "type": "chat" + }, + { + "id": "Pro/moonshotai/Kimi-K2.6", + "name": "Pro/moonshotai/Kimi-K2.6", + "display_name": "Pro/moonshotai/Kimi-K2.6", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.95, + "output": 4, + "cache_read": 0.16 + }, + "type": "chat" + }, + { + "id": "Pro/moonshotai/Kimi-K2.5", + "name": "Pro/moonshotai/Kimi-K2.5", + "display_name": "Pro/moonshotai/Kimi-K2.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0.45, + "output": 2.25 + }, + "type": "chat" + }, + { + "id": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "display_name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-08", + "last_updated": "2025-11-25", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" + }, + { + "id": "Pro/zai-org/GLM-4.7", + "name": "Pro/zai-org/GLM-4.7", + "display_name": "Pro/zai-org/GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 205000, + "output": 205000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0.6, + "output": 2.2 + }, + "type": "chat" + }, + { + "id": "Pro/zai-org/GLM-5", + "name": "Pro/zai-org/GLM-5", + "display_name": "Pro/zai-org/GLM-5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 205000, + "output": 205000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 1, + "output": 3.2 + }, + "type": "chat" + }, + { + "id": "Pro/zai-org/GLM-5.1", + "name": "Pro/zai-org/GLM-5.1", + "display_name": "Pro/zai-org/GLM-5.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 205000, + "output": 205000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-04-08", + "cost": { + "input": 1.4, + "output": 4.4, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "Pro/MiniMaxAI/MiniMax-M2.1", + "name": "Pro/MiniMaxAI/MiniMax-M2.1", + "display_name": "Pro/MiniMaxAI/MiniMax-M2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 197000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "Pro/MiniMaxAI/MiniMax-M2.5", + "name": "Pro/MiniMaxAI/MiniMax-M2.5", + "display_name": "Pro/MiniMaxAI/MiniMax-M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 192000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "cost": { + "input": 0.3, + "output": 1.22 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-OCR", + "name": "deepseek-ai/DeepSeek-OCR", + "display_name": "deepseek-ai/DeepSeek-OCR", + "modalities": { + "input": [ + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-10-20", + "last_updated": "2025-10-20", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-13", + "last_updated": "2025-11-25", + "cost": { + "input": 0.15, + "output": 0.15 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "display_name": "deepseek-ai/DeepSeek-V3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", + "cost": { + "input": 0.25, + "output": 1 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "display_name": "deepseek-ai/DeepSeek-V3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 164000, + "output": 164000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", + "cost": { + "input": 0.27, + "output": 0.42 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", + "cost": { + "input": 0.18, + "output": 0.18 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", + "cost": { + "input": 0.27, + "output": 1 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "display_name": "deepseek-ai/DeepSeek-R1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-11-25", + "cost": { + "input": 0.5, + "output": 2.18 + }, + "type": "chat" + }, + { + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-08", + "last_updated": "2025-11-25", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" + }, + { + "id": "moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "display_name": "moonshotai/Kimi-K2-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-25", + "cost": { + "input": 0.55, + "output": 2.5 + }, + "type": "chat" + }, + { + "id": "zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "display_name": "zai-org/GLM-4.6V", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-07", + "last_updated": "2025-12-07", + "cost": { + "input": 0.3, + "output": 0.9 + }, + "type": "chat" + }, + { + "id": "zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "display_name": "zai-org/GLM-4.6", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.5, + "output": 1.9 + }, + "type": "chat" + }, + { + "id": "zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "display_name": "zai-org/GLM-4.5V", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-13", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.86 + }, + "type": "chat" + }, + { + "id": "zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "display_name": "zai-org/GLM-4.5-Air", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.86 + }, + "type": "chat" + }, + { + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.086, + "output": 0.086 + }, + "type": "chat" + }, + { + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.086, + "output": 0.086 + }, + "type": "chat" + }, + { + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.57 + }, + "type": "chat" + }, + { + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.27, + "output": 0.27 + }, + "type": "chat" + }, + { + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.57 + }, + "type": "chat" + }, + { + "id": "PaddlePaddle/PaddleOCR-VL", + "name": "PaddlePaddle/PaddleOCR-VL", + "display_name": "PaddlePaddle/PaddleOCR-VL", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-10-16", + "last_updated": "2025-10-16", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "PaddlePaddle/PaddleOCR-VL-1.5", + "name": "PaddlePaddle/PaddleOCR-VL-1.5", + "display_name": "PaddlePaddle/PaddleOCR-VL-1.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "ascend-tribe/pangu-pro-moe", + "name": "ascend-tribe/pangu-pro-moe", + "display_name": "ascend-tribe/pangu-pro-moe", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-02", + "last_updated": "2026-01-16", + "cost": { + "input": 0.2, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.21, + "output": 0.57 + }, + "type": "chat" + }, + { + "id": "Kwaipilot/KAT-Dev", + "name": "Kwaipilot/KAT-Dev", + "display_name": "Kwaipilot/KAT-Dev", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-27", + "last_updated": "2026-01-16", + "cost": { + "input": 0.2, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-02", + "last_updated": "2025-11-25", + "cost": { + "input": 0.28, + "output": 1.1 + }, + "type": "chat" + }, + { + "id": "stepfun-ai/Step-3.5-Flash", + "name": "stepfun-ai/Step-3.5-Flash", + "display_name": "stepfun-ai/Step-3.5-Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0.1, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.5-9B", + "name": "Qwen/Qwen3.5-9B", + "display_name": "Qwen/Qwen3.5-9B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0.22, + "output": 1.74 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.5-4B", + "name": "Qwen/Qwen3.5-4B", + "display_name": "Qwen/Qwen3.5-4B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.5-122B-A10B", + "name": "Qwen/Qwen3.5-122B-A10B", + "display_name": "Qwen/Qwen3.5-122B-A10B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", + "cost": { + "input": 0.29, + "output": 2.32 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen/Qwen3.5-397B-A17B", + "display_name": "Qwen/Qwen3.5-397B-A17B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "cost": { + "input": 0.29, + "output": 1.74 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.5-27B", + "name": "Qwen/Qwen3.5-27B", + "display_name": "Qwen/Qwen3.5-27B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-25", + "last_updated": "2026-02-25", + "cost": { + "input": 0.26, + "output": 2.09 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.5-35B-A3B", + "name": "Qwen/Qwen3.5-35B-A3B", + "display_name": "Qwen/Qwen3.5-35B-A3B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-25", + "last_updated": "2026-02-25", + "cost": { + "input": 0.23, + "output": 1.86 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen/Qwen3.6-35B-A3B", + "display_name": "Qwen/Qwen3.6-35B-A3B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", + "cost": { + "input": 0.23, + "output": 1.86 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "cost": { + "input": 0.2, + "output": 1.5 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.59, + "output": 0.59 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-09-19", + "last_updated": "2025-11-25", + "cost": { + "input": 0.18, + "output": 0.18 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", + "cost": { + "input": 0.09, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "cost": { + "input": 0.18, + "output": 2 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", + "cost": { + "input": 0.25, + "output": 1 + } + }, + { + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-05", + "last_updated": "2025-11-25", + "cost": { + "input": 0.29, + "output": 1 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-11-11", + "last_updated": "2025-11-25", + "cost": { + "input": 0.18, + "output": 0.18 + } + }, + { + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "cost": { + "input": 0.07, + "output": 0.28 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.05, + "output": 0.05 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", + "cost": { + "input": 0.18, + "output": 0.68 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.59, + "output": 0.59 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-24", + "last_updated": "2025-11-25", + "cost": { + "input": 0.27, + "output": 0.27 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-11", + "last_updated": "2025-11-25", + "cost": { + "input": 0.29, + "output": 1 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "cost": { + "input": 0.2, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-03-06", + "last_updated": "2025-11-25", + "cost": { + "input": 0.15, + "output": 0.58 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.1, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2025-11-25", + "cost": { + "input": 0.09, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.3, + "output": 1.5 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-01-28", + "last_updated": "2025-11-25", + "cost": { + "input": 0.59, + "output": 0.59 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.1, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "display_name": "Qwen/Qwen2.5-14B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-01", + "last_updated": "2025-11-25", + "cost": { + "input": 0.07, + "output": 0.28 + } + }, + { + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "cost": { + "input": 0.06, + "output": 0.06 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-30", + "last_updated": "2025-11-25", + "cost": { + "input": 0.09, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.57 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.57 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 1.4 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.45, + "output": 3.5 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", + "cost": { + "input": 0.13, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.1, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", + "cost": { + "input": 0.07, + "output": 0.28 + }, + "type": "chat" + }, + { + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.57 + }, + "type": "chat" + }, + { + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.57 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "inclusionAI/Ring-1T", + "name": "inclusionAI/Ring-1T", + "display_name": "inclusionAI/Ring-1T", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "type": "chat" + }, + { + "id": "inclusionAI/Ling-1T", + "name": "inclusionAI/Ling-1T", + "display_name": "inclusionAI/Ling-1T", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen-Image-Edit-2509", + "name": "Qwen/Qwen-Image-Edit-2509", + "display_name": "Qwen/Qwen-Image-Edit-2509", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Qwen/Qwen-Image-Edit", + "name": "Qwen/Qwen-Image-Edit", + "display_name": "Qwen/Qwen-Image-Edit", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Qwen/Qwen-Image", + "name": "Qwen/Qwen-Image", + "display_name": "Qwen/Qwen-Image", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Wan-AI/Wan2.2-I2V-A14B", + "name": "Wan-AI/Wan2.2-I2V-A14B", + "display_name": "Wan-AI/Wan2.2-I2V-A14B", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "video" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Wan-AI/Wan2.2-T2V-A14B", + "name": "Wan-AI/Wan2.2-T2V-A14B", + "display_name": "Wan-AI/Wan2.2-T2V-A14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "display_name": "zai-org/GLM-4.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "stepfun-ai/step3", + "name": "stepfun-ai/step3", + "display_name": "stepfun-ai/step3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "TeleAI/TeleSpeechASR", + "name": "TeleAI/TeleSpeechASR", + "display_name": "TeleAI/TeleSpeechASR", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "THUDM/GLM-4.1V-9B-Thinking", + "name": "THUDM/GLM-4.1V-9B-Thinking", + "display_name": "THUDM/GLM-4.1V-9B-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "moonshotai/Kimi-Dev-72B", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMaxAI/MiniMax-M1-80k", + "display_name": "MiniMaxAI/MiniMax-M1-80k", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Tongyi-Zhiwen/QwenLong-L1-32B", + "name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "display_name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "display_name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen/Qwen3-30B-A3B", + "display_name": "Qwen/Qwen3-30B-A3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Reranker-8B", + "name": "Qwen/Qwen3-Reranker-8B", + "display_name": "Qwen/Qwen3-Reranker-8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "rerank" + }, + { + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen/Qwen3-Embedding-8B", + "display_name": "Qwen/Qwen3-Embedding-8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "embedding" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "Qwen/Qwen3-Reranker-4B", + "name": "Qwen/Qwen3-Reranker-4B", + "display_name": "Qwen/Qwen3-Reranker-4B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "rerank" + }, + { + "id": "Qwen/Qwen3-Embedding-4B", + "name": "Qwen/Qwen3-Embedding-4B", + "display_name": "Qwen/Qwen3-Embedding-4B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "embedding" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "Qwen/Qwen3-Reranker-0.6B", + "name": "Qwen/Qwen3-Reranker-0.6B", + "display_name": "Qwen/Qwen3-Reranker-0.6B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "rerank" + }, + { + "id": "Qwen/Qwen3-Embedding-0.6B", + "name": "Qwen/Qwen3-Embedding-0.6B", + "display_name": "Qwen/Qwen3-Embedding-0.6B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "embedding" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "display_name": "Qwen/Qwen3-235B-A22B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "Qwen/QVQ-72B-Preview", + "name": "Qwen/QVQ-72B-Preview", + "display_name": "Qwen/QVQ-72B-Preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-V2.5", + "name": "deepseek-ai/DeepSeek-V2.5", + "display_name": "deepseek-ai/DeepSeek-V2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "fnlp/MOSS-TTSD-v0.5", + "name": "fnlp/MOSS-TTSD-v0.5", + "display_name": "fnlp/MOSS-TTSD-v0.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "FunAudioLLM/CosyVoice2-0.5B", + "name": "FunAudioLLM/CosyVoice2-0.5B", + "display_name": "FunAudioLLM/CosyVoice2-0.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "FunAudioLLM/SenseVoiceSmall", + "name": "FunAudioLLM/SenseVoiceSmall", + "display_name": "FunAudioLLM/SenseVoiceSmall", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "IndexTeam/IndexTTS-2", + "name": "IndexTeam/IndexTTS-2", + "display_name": "IndexTeam/IndexTTS-2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "BAAI/bge-m3", + "name": "BAAI/bge-m3", + "display_name": "BAAI/bge-m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "BAAI/bge-reranker-v2-m3", + "name": "BAAI/bge-reranker-v2-m3", + "display_name": "BAAI/bge-reranker-v2-m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "rerank" + }, + { + "id": "netease-youdao/bce-embedding-base_v1", + "name": "netease-youdao/bce-embedding-base_v1", + "display_name": "netease-youdao/bce-embedding-base_v1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "embedding" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "netease-youdao/bce-reranker-base_v1", + "name": "netease-youdao/bce-reranker-base_v1", + "display_name": "netease-youdao/bce-reranker-base_v1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Kwai-Kolors/Kolors", + "name": "Kwai-Kolors/Kolors", + "display_name": "Kwai-Kolors/Kolors", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Qwen/Qwen2-VL-72B-Instruct", + "name": "Qwen/Qwen2-VL-72B-Instruct", + "display_name": "Qwen/Qwen2-VL-72B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + } + }, + { + "id": "internlm/internlm2_5-7b-chat", + "name": "internlm/internlm2_5-7b-chat", + "display_name": "internlm/internlm2_5-7b-chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2-7B-Instruct", + "name": "Qwen/Qwen2-7B-Instruct", + "display_name": "Qwen/Qwen2-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "THUDM/glm-4-9b-chat", + "name": "THUDM/glm-4-9b-chat", + "display_name": "THUDM/glm-4-9b-chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "BAAI/bge-large-en-v1.5", + "name": "BAAI/bge-large-en-v1.5", + "display_name": "BAAI/bge-large-en-v1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "BAAI/bge-large-zh-v1.5", + "name": "BAAI/bge-large-zh-v1.5", + "display_name": "BAAI/bge-large-zh-v1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + } + }, + { + "id": "Pro/BAAI/bge-m3", + "name": "Pro/BAAI/bge-m3", + "display_name": "Pro/BAAI/bge-m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "Pro/Qwen/Qwen2.5-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Pro/BAAI/bge-reranker-v2-m3", + "name": "Pro/BAAI/bge-reranker-v2-m3", + "display_name": "Pro/BAAI/bge-reranker-v2-m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "rerank" + }, + { + "id": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Pro/Qwen/Qwen2-7B-Instruct", + "name": "Pro/Qwen/Qwen2-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Pro/THUDM/glm-4-9b-chat", + "name": "Pro/THUDM/glm-4-9b-chat", + "display_name": "Pro/THUDM/glm-4-9b-chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "THUDM/GLM-Z1-Rumination-32B-0414", + "name": "THUDM/GLM-Z1-Rumination-32B-0414", + "display_name": "THUDM/GLM-Z1-Rumination-32B-0414", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "stabilityai/stable-diffusion-xl-base-1.0", + "name": "stabilityai/stable-diffusion-xl-base-1.0", + "display_name": "stabilityai/stable-diffusion-xl-base-1.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "black-forest-labs/FLUX.1-schnell", + "name": "black-forest-labs/FLUX.1-schnell", + "display_name": "black-forest-labs/FLUX.1-schnell", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] }, - "type": "chat" + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "black-forest-labs/FLUX.1-dev", + "name": "black-forest-labs/FLUX.1-dev", + "display_name": "black-forest-labs/FLUX.1-dev", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.125, - "output": 0.5 - }, - "type": "chat" + } }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "Pro/black-forest-labs/FLUX.1-schnell", + "name": "Pro/black-forest-labs/FLUX.1-schnell", + "display_name": "Pro/black-forest-labs/FLUX.1-schnell", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 16384, - "output": 16384 - }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", - "cost": { - "input": 3, - "output": 4 - }, - "type": "chat" + } }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "stabilityai/stable-diffusion-3-5-large", + "name": "stabilityai/stable-diffusion-3-5-large", + "display_name": "stabilityai/stable-diffusion-3-5-large", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", - "cost": { - "input": 0.17, - "output": 0.68 - }, - "type": "chat" + } }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "fishaudio/fish-speech-1.4", + "name": "fishaudio/fish-speech-1.4", + "display_name": "fishaudio/fish-speech-1.4", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0.58, - "output": 1.68 - }, - "type": "chat" + "supported": false + } }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", + "id": "RVC-Boss/GPT-SoVITS", + "name": "RVC-Boss/GPT-SoVITS", + "display_name": "RVC-Boss/GPT-SoVITS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", - "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + } }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 0301", + "id": "fishaudio/fish-speech-1.5", + "name": "fishaudio/fish-speech-1.5", + "display_name": "fishaudio/fish-speech-1.5", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, - "limit": { - "context": 4096, - "output": 4096 - }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false + } + }, + { + "id": "black-forest-labs/FLUX.1-pro", + "name": "black-forest-labs/FLUX.1-pro", + "display_name": "black-forest-labs/FLUX.1-pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", - "cost": { - "input": 1.5, - "output": 2 + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "LoRA/black-forest-labs/FLUX.1-dev", + "name": "LoRA/black-forest-labs/FLUX.1-dev", + "display_name": "LoRA/black-forest-labs/FLUX.1-dev", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] }, - "type": "chat" + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "SeedLLM/Seed-Rice-7B", + "name": "SeedLLM/Seed-Rice-7B", + "display_name": "SeedLLM/Seed-Rice-7B", "modalities": { "input": [ "text" @@ -95720,43 +103644,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.075, - "output": 0.3 - }, "type": "chat" - }, + } + ] + }, + "nvidia": { + "id": "nvidia", + "name": "Nvidia", + "display_name": "Nvidia", + "api": "https://integrate.api.nvidia.com/v1", + "doc": "https://docs.api.nvidia.com/nim/", + "models": [ { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "deepseek-ai/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -95764,41 +103686,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "deepseek-ai/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -95808,29 +103713,30 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "bytedance/seed-oss-36b-instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ "text" @@ -95840,29 +103746,33 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 60, - "output": 120 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "moonshotai/kimi-k2-instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -95872,30 +103782,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -95906,28 +103815,29 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2025-01-01", + "last_updated": "2025-09-05", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -95937,40 +103847,56 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -95978,21 +103904,32 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "z-ai/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -96002,27 +103939,40 @@ ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.02, + "input": 0, "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", + "id": "z-ai/glm4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -96032,320 +103982,277 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1, - "output": 2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.14, + "input": 0, "output": 0 }, "type": "chat" }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "openai/whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "attachment": false, + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "black-forest-labs/flux_1-kontext-dev", + "name": "FLUX.1-Kontext-dev", + "display_name": "FLUX.1-Kontext-dev", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 40960, + "output": 40960 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": true, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "black-forest-labs/flux_1-schnell", + "name": "FLUX.1-schnell", + "display_name": "FLUX.1-schnell", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "image" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 77, + "output": 8192 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-08-01", + "last_updated": "2026-02-04", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "black-forest-labs/flux.1-dev", + "name": "FLUX.1-dev", + "display_name": "FLUX.1-dev", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 512, - "output": 1024 + "context": 4096, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, + "input": 0, "output": 0 }, "type": "chat" }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "black-forest-labs/flux_2-klein-4b", + "name": "FLUX.2 Klein 4B", + "display_name": "FLUX.2 Klein 4B", "modalities": { "input": [ + "image", "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 40960, + "output": 40960 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-01-14", + "last_updated": "2026-01-31", "cost": { - "input": 16.5, - "output": 66, - "cache_read": 8.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "nvidia/usdvalidate", + "name": "usdvalidate", + "display_name": "usdvalidate", "modalities": { "input": [ "text" @@ -96355,89 +104262,63 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 8192, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "release_date": "2024-07-24", + "last_updated": "2025-01-08", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "nvidia/magpie-tts-zeroshot", + "name": "magpie-tts-zeroshot", + "display_name": "magpie-tts-zeroshot", "modalities": { "input": [ "text", - "image" + "audio" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": true, + "open_weights": true, + "release_date": "2025-05-22", + "last_updated": "2025-06-12", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "nvidia/gliner-pii", + "name": "gliner-pii", + "display_name": "gliner-pii", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -96445,87 +104326,61 @@ }, "limit": { "context": 128000, - "output": 1536 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.12, + "input": 0, "output": 0 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "nvidia/active-speaker-detection", + "name": "Active Speaker Detection", + "display_name": "Active Speaker Detection", "modalities": { "input": [ - "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "nvidia/sparsedrive", + "name": "sparsedrive", + "display_name": "sparsedrive", "modalities": { "input": [ - "text", - "image" + "video" ], "output": [ "text" @@ -96533,66 +104388,59 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "open_weights": true, + "release_date": "2025-03-18", + "last_updated": "2025-07-20", "cost": { - "input": 10, - "output": 30 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "nvidia/nemotron-content-safety-reasoning-4b", + "name": "nemotron-content-safety-reasoning-4b", + "display_name": "nemotron-content-safety-reasoning-4b", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "nvidia/nv-embed-v1", + "name": "nv-embed-v1", + "display_name": "nv-embed-v1", "modalities": { "input": [ "text" @@ -96602,62 +104450,61 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-06-07", + "last_updated": "2025-07-22", "cost": { - "input": 5.33, - "output": 16 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "nvidia/cosmos-transfer1-7b", + "name": "cosmos-transfer1-7b", + "display_name": "cosmos-transfer1-7b", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2025-06-13", + "last_updated": "2025-06-30", "cost": { - "input": 0.37, - "output": 0.37 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "nvidia/nv-embedcode-7b-v1", + "name": "nv-embedcode-7b-v1", + "display_name": "nv-embedcode-7b-v1", "modalities": { "input": [ "text" @@ -96667,30 +104514,28 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 32768, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2025-03-17", + "last_updated": "2025-05-29", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "nvidia/nvidia-nemotron-nano-9b-v2", + "name": "nvidia-nemotron-nano-9b-v2", + "display_name": "nvidia-nemotron-nano-9b-v2", "modalities": { "input": [ "text" @@ -96700,201 +104545,162 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, + "open_weights": true, "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 2, - "output": 6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "nvidia/cosmos-predict1-5b", + "name": "cosmos-predict1-5b", + "display_name": "cosmos-predict1-5b", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "release_date": "2025-03-18", + "last_updated": "2025-03-18", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "display_name": "DeepSeek-V3.2-Speciale", + "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning", + "name": "Nemotron 3 Nano Omni", + "display_name": "Nemotron 3 Nano Omni", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 256000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-04-28", + "last_updated": "2026-04-28", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "nvidia/synthetic-video-detector", + "name": "synthetic-video-detector", + "display_name": "synthetic-video-detector", "modalities": { "input": [ - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super", + "display_name": "Nemotron 3 Super", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-04", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 2.04, - "output": 2.04 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "nvidia/studiovoice", + "name": "studiovoice", + "display_name": "studiovoice", "modalities": { "input": [ "text" @@ -96904,83 +104710,59 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "open_weights": true, + "release_date": "2024-10-03", + "last_updated": "2025-06-13", "cost": { - "input": 0.1, + "input": 0, "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "nvidia/rerank-qa-mistral-4b", + "name": "rerank-qa-mistral-4b", + "display_name": "rerank-qa-mistral-4b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": true, + "release_date": "2024-03-17", + "last_updated": "2025-01-17", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "nvidia/llama-3_1-nemotron-safety-guard-8b-v3", + "name": "llama-3.1-nemotron-safety-guard-8b-v3", + "display_name": "llama-3.1-nemotron-safety-guard-8b-v3", "modalities": { "input": [ "text" @@ -96990,29 +104772,28 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "nvidia/llama-3_3-nemotron-super-49b-v1_5", + "name": "Llama 3.3 Nemotron Super 49B v1.5", + "display_name": "Llama 3.3 Nemotron Super 49B v1.5", "modalities": { "input": [ "text" @@ -97022,141 +104803,94 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "nvidia/streampetr", + "name": "streampetr", + "display_name": "streampetr", "modalities": { "input": [ - "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "nvidia/cosmos-transfer2_5-2b", + "name": "cosmos-transfer2.5-2b", + "display_name": "cosmos-transfer2.5-2b", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "nvidia/usdcode", + "name": "usdcode", + "display_name": "usdcode", "modalities": { "input": [ "text" @@ -97166,33 +104900,32 @@ ] }, "limit": { - "context": 32000, + "context": 128000, "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "nvidia/nemotron-voicechat", + "name": "nemotron-voicechat", + "display_name": "nemotron-voicechat", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ "text" @@ -97200,28 +104933,27 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "nvidia/llama-3_2-nemoretriever-300m-embed-v1", + "name": "llama-3_2-nemoretriever-300m-embed-v1", + "display_name": "llama-3_2-nemoretriever-300m-embed-v1", "modalities": { "input": [ "text" @@ -97231,30 +104963,32 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 32768, + "output": 2048 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "release_date": "2025-07-24", + "last_updated": "2025-07-24", "cost": { - "input": 0.13, + "input": 0, "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "nvidia/llama-nemotron-rerank-vl-1b-v2", + "name": "llama-nemotron-rerank-vl-1b-v2", + "display_name": "llama-nemotron-rerank-vl-1b-v2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -97262,47 +104996,30 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "attachment": true, + "open_weights": true, + "release_date": "2026-03-31", + "last_updated": "2026-03-31", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "nvidia/bevformer", + "name": "bevformer", + "display_name": "bevformer", "modalities": { "input": [ - "text" + "video" ], "output": [ "text" @@ -97310,63 +105027,60 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2025-03-18", + "last_updated": "2025-07-20", "cost": { - "input": 0.16, - "output": 0.64 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "nvidia/llama-3_3-nemotron-super-49b-v1", + "name": "Llama 3.3 Nemotron Super 49B v1", + "display_name": "Llama 3.3 Nemotron Super 49B v1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-07", + "last_updated": "2025-04-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "nvidia/riva-translate-4b-instruct-v1_1", + "name": "riva-translate-4b-instruct-v1_1", + "display_name": "riva-translate-4b-instruct-v1_1", "modalities": { "input": [ "text" @@ -97376,29 +105090,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 1.14, - "output": 4.56 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "nvidia/nemotron-3-content-safety", + "name": "nemotron-3-content-safety", + "display_name": "nemotron-3-content-safety", "modalities": { "input": [ "text" @@ -97409,28 +105122,27 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "nvidia/llama-nemotron-embed-vl-1b-v2", + "name": "llama-nemotron-embed-vl-1b-v2", + "display_name": "llama-nemotron-embed-vl-1b-v2", "modalities": { "input": [ "text", @@ -97441,41 +105153,28 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2026-02-10", + "last_updated": "2026-02-10", "cost": { - "input": 0.6, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "nemotron-3-nano-30b-a3b", + "display_name": "nemotron-3-nano-30b-a3b", "modalities": { "input": [ "text" @@ -97485,29 +105184,30 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-09", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "nvidia/nemotron-mini-4b-instruct", + "name": "nemotron-mini-4b-instruct", + "display_name": "nemotron-mini-4b-instruct", "modalities": { "input": [ "text" @@ -97527,19 +105227,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2024-08-21", + "last_updated": "2024-08-26", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "mistralai/mixtral-8x7b-instruct", + "name": "Mistral: Mixtral 8x7B Instruct", + "display_name": "Mistral: Mixtral 8x7B Instruct", "modalities": { "input": [ "text" @@ -97549,62 +105248,59 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 32768, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2023-12-10", + "last_updated": "2026-03-15", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "mistralai/mistral-7b-instruct-v03", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 0.2, - "output": 0.78 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "mistralai/mistral-small-4-119b-2603", + "name": "mistral-small-4-119b-2603", + "display_name": "mistral-small-4-119b-2603", "modalities": { "input": [ "text" @@ -97615,63 +105311,60 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675B Instruct 2512", + "display_name": "Mistral Large 3 675B Instruct 2512", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "mistralai/mixtral-8x22b-instruct", + "name": "Mistral: Mixtral 8x22B Instruct", + "display_name": "Mistral: Mixtral 8x22B Instruct", "modalities": { "input": [ "text" @@ -97681,66 +105374,28 @@ ] }, "limit": { - "context": 200000, - "output": 100000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", - "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 - }, - "type": "chat" - }, - { - "id": "gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 + "context": 65536, + "output": 13108 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "mistralai/magistral-small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ "text" @@ -97750,266 +105405,168 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "mistralai/mistral-medium-3-instruct", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "mistralai/devstral-2-123b-instruct-2512", + "name": "Devstral-2-123B-Instruct-2512", + "display_name": "Devstral-2-123B-Instruct-2512", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-09", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "mistralai/mistral-nemotron", + "name": "mistral-nemotron", + "display_name": "mistral-nemotron", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-11", + "last_updated": "2025-06-12", "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ "text", @@ -98020,30 +105577,41 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 262144, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -98053,98 +105621,104 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "qwen/qwen-image-edit", + "name": "Qwen Image Edit", + "display_name": "Qwen Image Edit", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "qwen/qwen2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32b Instruct", + "display_name": "Qwen2.5 Coder 32b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-06", + "last_updated": "2024-11-06", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -98154,8 +105728,8 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, @@ -98163,31 +105737,30 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 262144, "output": 16384 }, "temperature": true, @@ -98195,71 +105768,53 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "qwen/qwen-image", + "name": "Qwen Image", + "display_name": "Qwen Image", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 8192, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 15, - "output": 120 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "google/gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "display_name": "Gemma-3-27B-IT", "modalities": { "input": [ "text", @@ -98270,56 +105825,43 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "google/gemma-4-31b-it", + "name": "Gemma-4-31B-IT", + "display_name": "Gemma-4-31B-IT", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -98327,23 +105869,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "google/gemma-3n-e2b-it", + "name": "Gemma 3n E2b It", + "display_name": "Gemma 3n E2b It", "modalities": { "input": [ "text", @@ -98354,8 +105894,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -98363,61 +105903,53 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-06-12", + "last_updated": "2025-06-12", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "google/gemma-3n-e4b-it", + "name": "Gemma 3n E4b It", + "display_name": "Gemma 3n E4b It", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "attachment": true, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "google/gemma-2-2b-it", + "name": "Gemma 2 2b It", + "display_name": "Gemma 2 2b It", "modalities": { "input": [ "text" @@ -98427,133 +105959,95 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-16", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "google/google-paligemma", + "name": "paligemma", + "display_name": "paligemma", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "attachment": true, + "open_weights": true, + "release_date": "2024-05-14", + "last_updated": "2024-08-26", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-Mini", + "display_name": "Phi-4-Mini", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "microsoft/phi-4-multimodal-instruct", + "name": "Phi 4 Multimodal", + "display_name": "Phi 4 Multimodal", "modalities": { "input": [ "text" @@ -98564,32 +106058,29 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "upstage/solar-10_7b-instruct", + "name": "solar-10.7b-instruct", + "display_name": "solar-10.7b-instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -98597,77 +106088,78 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "release_date": "2024-06-05", + "last_updated": "2025-04-10", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "minimaxai/minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 10, - "output": 30 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "minimaxai/minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -98676,65 +106168,38 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-04-11", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "abliteration-ai": { - "id": "abliteration-ai", - "name": "abliteration.ai", - "display_name": "abliteration.ai", - "api": "https://api.abliteration.ai/v1", - "doc": "https://docs.abliteration.ai/models", - "models": [ + }, { - "id": "abliterated-model", - "name": "Abliterated Model", - "display_name": "Abliterated Model", + "id": "sarvamai/sarvam-m", + "name": "sarvam-m", + "display_name": "sarvam-m", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 150000, + "context": 128000, "output": 8192 }, "temperature": true, @@ -98742,28 +106207,20 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-01-06", - "last_updated": "2026-01-06", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 3, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "cohere": { - "id": "cohere", - "name": "Cohere", - "display_name": "Cohere", - "doc": "https://docs.cohere.com/docs/models", - "models": [ + }, { - "id": "command-a-reasoning-08-2025", - "name": "Command A Reasoning", - "display_name": "Command A Reasoning", + "id": "abacusai/dracarys-llama-3_1-70b-instruct", + "name": "dracarys-llama-3.1-70b-instruct", + "display_name": "dracarys-llama-3.1-70b-instruct", "modalities": { "input": [ "text" @@ -98773,30 +106230,28 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2024-09-11", + "last_updated": "2025-05-22", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "command-r7b-12-2024", - "name": "Command R7B", - "display_name": "Command R7B", + "id": "baai/bge-m3", + "name": "BGE M3", + "display_name": "BGE M3", "modalities": { "input": [ "text" @@ -98806,57 +106261,59 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 8192, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "release_date": "2024-01-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "c4ai-aya-vision-8b", - "name": "Aya Vision 8B", - "display_name": "Aya Vision 8B", + "id": "meta/llama-3.1-70b-instruct", + "name": "Llama 3.1 70b Instruct", + "display_name": "Llama 3.1 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-03-04", - "last_updated": "2025-05-14", + "release_date": "2024-07-16", + "last_updated": "2024-07-16", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "meta/esm2-650m", + "name": "esm2-650m", + "display_name": "esm2-650m", "modalities": { "input": [ "text" @@ -98867,55 +106324,60 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-08-29", + "last_updated": "2025-03-10", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "c4ai-aya-expanse-8b", - "name": "Aya Expanse 8B", - "display_name": "Aya Expanse 8B", + "id": "meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 4000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-10-24", - "last_updated": "2024-10-24", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "command-r7b-arabic-02-2025", - "name": "Command R7B Arabic", - "display_name": "Command R7B Arabic", + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1b Instruct", + "display_name": "Llama 3.2 1b Instruct", "modalities": { "input": [ "text" @@ -98926,7 +106388,7 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -98935,23 +106397,22 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "command-a-vision-07-2025", - "name": "Command A Vision", - "display_name": "Command A Vision", + "id": "meta/esmfold", + "name": "esmfold", + "display_name": "esmfold", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -98959,7 +106420,7 @@ }, "limit": { "context": 128000, - "output": 8000 + "output": 8192 }, "temperature": true, "tool_call": false, @@ -98968,19 +106429,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "release_date": "2024-03-15", + "last_updated": "2025-06-12", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "c4ai-aya-vision-32b", - "name": "Aya Vision 32B", - "display_name": "Aya Vision 32B", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11b Vision Instruct", + "display_name": "Llama 3.2 11b Vision Instruct", "modalities": { "input": [ "text", @@ -98991,56 +106451,62 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-03-04", - "last_updated": "2025-05-14", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "command-a-translate-08-2025", - "name": "Command A Translate", - "display_name": "Command A Translate", + "id": "meta/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17b 128e Instruct", + "display_name": "Llama 4 Maverick 17b 128e Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2024-02", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "display_name": "Llama 3.3 70b Instruct", "modalities": { "input": [ "text" @@ -99051,7 +106517,7 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -99060,19 +106526,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-11-26", + "last_updated": "2024-11-26", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "c4ai-aya-expanse-32b", - "name": "Aya Expanse 32B", - "display_name": "Aya Expanse 32B", + "id": "meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -99082,8 +106547,8 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 32768, + "output": 32000 }, "temperature": true, "tool_call": false, @@ -99092,55 +106557,50 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-10-24", - "last_updated": "2024-10-24", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "command-a-03-2025", - "name": "Command A", - "display_name": "Command A", + "id": "meta/llama-guard-4-12b", + "name": "Llama Guard 4 12B", + "display_name": "Llama Guard 4 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2025-04-05", + "last_updated": "2026-04-30", "cost": { - "input": 2.5, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "cloudferro-sherlock": { - "id": "cloudferro-sherlock", - "name": "CloudFerro Sherlock", - "display_name": "CloudFerro Sherlock", - "api": "https://api-sherlock.cloudferro.com/openai/v1/", - "doc": "https://docs.sherlock.cloudferro.com/", - "models": [ - { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + }, + { + "id": "meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -99150,8 +106610,8 @@ ] }, "limit": { - "context": 70000, - "output": 70000 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -99160,19 +106620,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10-09", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.92, - "output": 2.92 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "stepfun-ai/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -99182,8 +106642,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -99191,25 +106651,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 2.92, - "output": 2.92 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "speakleash/Bielik-11B-v3.0-Instruct", - "name": "Bielik 11B v3.0 Instruct", - "display_name": "Bielik 11B v3.0 Instruct", + "id": "deepseek-ai/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -99219,29 +106674,42 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.67, - "output": 0.67 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "speakleash/Bielik-11B-v2.6-Instruct", - "name": "Bielik 11B v2.6 Instruct", - "display_name": "Bielik 11B v2.6 Instruct", + "id": "deepseek-ai/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -99251,40 +106719,63 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.67, - "output": 0.67 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "anthropic": { + "id": "anthropic", + "name": "Anthropic", + "display_name": "Anthropic", + "doc": "https://docs.anthropic.com/en/docs/about-claude/models", + "models": [ { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196000, - "output": 16000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -99292,46 +106783,36 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.3, - "output": 1.2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" - } - ] - }, - "kuae-cloud-coding-plan": { - "id": "kuae-cloud-coding-plan", - "name": "KUAE Cloud Coding Plan", - "display_name": "KUAE Cloud Coding Plan", - "api": "https://coding-plan-endpoint.kuaecloud.net/v1", - "doc": "https://docs.mthreads.com/kuaecloud/kuaecloud-doc-online/coding_plan/", - "models": [ + }, { - "id": "GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -99341,87 +106822,74 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" - } - ] - }, - "xai": { - "id": "xai", - "name": "xai", - "display_name": "xai", - "doc": "https://docs.x.ai/docs/models", - "models": [ + }, { - "id": "grok-2-1212", - "name": "Grok 2 1212", - "display_name": "Grok 2 1212", + "id": "claude-3-haiku-20240307", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-12-12", - "last_updated": "2024-12-12", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "grok-vision-beta", - "name": "Grok Vision Beta", - "display_name": "Grok Vision Beta", + "id": "claude-3-sonnet-20240229", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, + "context": 200000, "output": 4096 }, "temperature": true, @@ -99431,110 +106899,106 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 5, + "input": 3, "output": 15, - "cache_read": 5 + "cache_read": 0.3, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "claude-3-5-haiku-latest", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "grok-3-mini-fast", - "name": "Grok 3 Mini Fast", - "display_name": "Grok 3 Mini Fast", + "id": "claude-3-opus-20240229", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-3-mini-latest", - "name": "Grok 3 Mini Latest", - "display_name": "Grok 3 Mini Latest", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -99542,33 +107006,35 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "grok-3-fast", - "name": "Grok 3 Fast", - "display_name": "Grok 3 Fast", + "id": "claude-3-5-sonnet-20240620", + "name": "Claude Sonnet 3.5", + "display_name": "Claude Sonnet 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -99576,68 +107042,73 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-04-30", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.25 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-2-vision-latest", - "name": "Grok 2 Vision Latest", - "display_name": "Grok 2 Vision Latest", + "id": "claude-opus-4-0", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-4.20-0309-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -99645,71 +107116,104 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-3-mini-fast-latest", - "name": "Grok 3 Mini Fast Latest", - "display_name": "Grok 3 Mini Fast Latest", + "id": "claude-sonnet-4-0", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -99717,35 +107221,41 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -99753,32 +107263,40 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-3-latest", - "name": "Grok 3 Latest", - "display_name": "Grok 3 Latest", + "id": "claude-3-5-haiku-20241022", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -99786,32 +107304,35 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "grok-2", - "name": "Grok 2", - "display_name": "Grok 2", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -99819,33 +107340,36 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -99853,294 +107377,425 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "grok-4.20-0309-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "grok-3-fast-latest", - "name": "Grok 3 Fast Latest", - "display_name": "Grok 3 Fast Latest", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "type": "chat" + }, + { + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { "input": 5, "output": 25, - "cache_read": 1.25 + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "grok-4.20-multi-agent-0309", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 200000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { "input": 3, "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-2-latest", - "name": "Grok 2 Latest", - "display_name": "Grok 2 Latest", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-beta", - "name": "Grok Beta", - "display_name": "Grok Beta", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { "input": 5, - "output": 15, - "cache_read": 5 + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" - }, + } + ] + }, + "zhipuai-coding-plan": { + "id": "zhipuai-coding-plan", + "name": "Zhipu AI Coding Plan", + "display_name": "Zhipu AI Coding Plan", + "api": "https://open.bigmodel.cn/api/coding/paas/v4", + "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", + "models": [ { - "id": "grok-2-vision", - "name": "Grok 2 Vision", - "display_name": "Grok 2 Vision", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "grok-4-1-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -100148,22 +107803,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "release_date": "2026-04-01", + "last_updated": "2026-04-01", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -100173,8 +107839,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -100182,60 +107848,79 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "grok-2-vision-1212", - "name": "Grok 2 Vision 1212", - "display_name": "Grok 2 Vision 1212", + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "search": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -100246,63 +107931,71 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "atomic-chat": { + "id": "atomic-chat", + "name": "Atomic Chat", + "display_name": "Atomic Chat", + "api": "http://127.0.0.1:1337/v1", + "doc": "https://atomic.chat", + "models": [ { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "gemma-4-E4B-it-IQ4_XS", + "name": "Gemma 4 E4B Instruct (IQ4_XS)", + "display_name": "Gemma 4 E4B Instruct (IQ4_XS)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-3-mini-fast-beta", - "name": "Grok 3 Mini Fast Beta", - "display_name": "Grok 3 Mini Fast Beta", + "id": "gemma-4-E4B-it-MLX-4bit", + "name": "Gemma 4 E4B Instruct (MLX 4-bit)", + "display_name": "Gemma 4 E4B Instruct (MLX 4-bit)", "modalities": { "input": [ "text" @@ -100312,55 +108005,60 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "effort": "low" - }, - "search": { "supported": false }, "attachment": false, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "grok-3-mini-beta", - "name": "Grok 3 Mini Beta", - "display_name": "Grok 3 Mini Beta", + "id": "Qwen3_5-9B-Q4_K_M", + "name": "Qwen 3.5 9B (Q4_K_M)", + "display_name": "Qwen 3.5 9B (Q4_K_M)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "low" - }, - "search": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "release_date": "2026-03-05", + "last_updated": "2026-04-04", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "grok-3-fast-beta", - "name": "Grok 3 Fast Beta", - "display_name": "Grok 3 Fast Beta", + "id": "Meta-Llama-3_1-8B-Instruct-GGUF", + "name": "Meta Llama 3.1 8B Instruct (GGUF)", + "display_name": "Meta Llama 3.1 8B Instruct (GGUF)", "modalities": { "input": [ "text" @@ -100370,24 +108068,28 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 131072, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "grok-2-image-1212", - "name": "Grok 2 Image 1212", - "display_name": "Grok 2 Image 1212", + "id": "Qwen3_5-9B-MLX-4bit", + "name": "Qwen 3.5 9B (MLX 4-bit)", + "display_name": "Qwen 3.5 9B (MLX 4-bit)", "modalities": { "input": [ "text", @@ -100398,24 +108100,37 @@ ] }, "limit": { - "context": 130000, - "output": 100000 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false + "attachment": true, + "open_weights": true, + "release_date": "2026-03-05", + "last_updated": "2026-04-04", + "cost": { + "input": 0, + "output": 0 }, - "attachment": false, "type": "chat" - }, + } + ] + }, + "github-models": { + "id": "github-models", + "name": "GitHub Models", + "display_name": "GitHub Models", + "api": "https://models.github.ai/inference", + "doc": "https://docs.github.com/en/github-models", + "models": [ { - "id": "grok-3-beta", - "name": "Grok 3 Beta", - "display_name": "Grok 3 Beta", + "id": "cohere/cohere-command-r-plus", + "name": "Cohere Command R+", + "display_name": "Cohere Command R+", "modalities": { "input": [ "text" @@ -100425,33 +108140,29 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, "attachment": false, + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-04-04", + "last_updated": "2024-08-01", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" - } - ] - }, - "meganova": { - "id": "meganova", - "name": "Meganova", - "display_name": "Meganova", - "api": "https://api.meganova.ai/v1", - "doc": "https://docs.meganova.ai", - "models": [ + }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "cohere/cohere-command-r-plus-08-2024", + "name": "Cohere Command R+ 08-2024", + "display_name": "Cohere Command R+ 08-2024", "modalities": { "input": [ "text" @@ -100461,8 +108172,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -100470,32 +108181,31 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.09, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-Plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "cohere/cohere-command-r", + "name": "Cohere Command R", + "display_name": "Cohere Command R", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -100503,65 +108213,53 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02", - "last_updated": "2026-02", + "knowledge": "2024-03", + "release_date": "2024-03-11", + "last_updated": "2024-08-01", "cost": { - "input": 0.4, - "output": 2.4, - "reasoning": 2.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "cohere/cohere-command-r-08-2024", + "name": "Cohere Command R 08-2024", + "display_name": "Cohere Command R 08-2024", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "attachment": false, + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "cohere/cohere-command-a", + "name": "Cohere Command A", + "display_name": "Cohere Command A", "modalities": { "input": [ "text" @@ -100571,8 +108269,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -100580,75 +108278,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.8, - "output": 2.56 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "openai/o1-preview", + "name": "OpenAI o1-preview", + "display_name": "OpenAI o1-preview", "modalities": { "input": [ "text" @@ -100658,11 +108336,11 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -100670,29 +108348,32 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.45, - "output": 1.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24B Instruct", - "display_name": "Mistral Small 3.2 24B Instruct", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", @@ -100703,8 +108384,8 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -100712,10 +108393,10 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 0, "output": 0 @@ -100723,83 +108404,54 @@ "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.02, - "output": 0.04 - }, - "type": "chat" - }, - { - "id": "XiaomiMiMo/MiMo-V2-Flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, @@ -100807,113 +108459,150 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": true, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "OpenAI o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { - "input": 0.27, - "output": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.25, - "output": 0.88 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "OpenAI o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-10", - "last_updated": "2025-10-10", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.27, - "output": 0.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "OpenAI o3-mini", "modalities": { "input": [ "text" @@ -100923,10 +108612,10 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": true, @@ -100935,65 +108624,80 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.5, - "output": 2.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.26, - "output": 0.38 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "openai/o1-mini", + "name": "OpenAI o1-mini", + "display_name": "OpenAI o1-mini", "modalities": { "input": [ "text" @@ -101003,11 +108707,11 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -101015,41 +108719,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { - "input": 0.6, - "output": 2.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "ai21-labs/ai21-jamba-1.5-mini", + "name": "AI21 Jamba 1.5 Mini", + "display_name": "AI21 Jamba 1.5 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101057,32 +108763,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { - "input": 0.45, - "output": 2.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "ai21-labs/ai21-jamba-1.5-large", + "name": "AI21 Jamba 1.5 Large", + "display_name": "AI21 Jamba 1.5 Large", "modalities": { "input": [ "text" @@ -101092,8 +108787,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101101,31 +108796,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "core42/jais-30b-chat", + "name": "JAIS 30b Chat", + "display_name": "JAIS 30b Chat", "modalities": { "input": [ "text" @@ -101135,8 +108820,8 @@ ] }, "limit": { - "context": 196608, - "output": 131072 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -101144,72 +108829,54 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2023-03", + "release_date": "2023-08-30", + "last_updated": "2023-08-30", "cost": { - "input": 0.28, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "evroc": { - "id": "evroc", - "name": "evroc", - "display_name": "evroc", - "api": "https://models.think.evroc.com/v1", - "doc": "https://docs.evroc.com/products/think/overview.html", - "models": [ + }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen3 VL 30B", - "display_name": "Qwen3 VL 30B", + "id": "microsoft/phi-3-medium-128k-instruct", + "name": "Phi-3-medium instruct (128k)", + "display_name": "Phi-3-medium instruct (128k)", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 100000 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.24, - "output": 0.94 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "microsoft/phi-3-medium-4k-instruct", + "name": "Phi-3-medium instruct (4k)", + "display_name": "Phi-3-medium instruct (4k)", "modalities": { "input": [ "text" @@ -101219,27 +108886,30 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 4096, + "output": 1024 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.12, - "output": 0.12 + "input": 0, + "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", - "name": "Qwen3 30B 2507", - "display_name": "Qwen3 30B 2507", + "id": "microsoft/phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -101249,27 +108919,30 @@ ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 16000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.35, - "output": 1.42 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/devstral-small-2-24b-instruct-2512", - "name": "Devstral Small 2 24B Instruct 2512", - "display_name": "Devstral Small 2 24B Instruct 2512", + "id": "microsoft/phi-3-mini-128k-instruct", + "name": "Phi-3-mini instruct (128k)", + "display_name": "Phi-3-mini instruct (128k)", "modalities": { "input": [ "text" @@ -101279,30 +108952,32 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.12, - "output": 0.47 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/Voxtral-Small-24B-2507", - "name": "Voxtral Small 24B", - "display_name": "Voxtral Small 24B", + "id": "microsoft/phi-4-reasoning", + "name": "Phi-4-Reasoning", + "display_name": "Phi-4-Reasoning", "modalities": { "input": [ - "audio", "text" ], "output": [ @@ -101310,28 +108985,30 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/Magistral-Small-2509", - "name": "Magistral Small 1.2 24B", - "display_name": "Magistral Small 1.2 24B", + "id": "microsoft/phi-3-small-128k-instruct", + "name": "Phi-3-small instruct (128k)", + "display_name": "Phi-3-small instruct (128k)", "modalities": { "input": [ "text" @@ -101341,27 +109018,30 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.59, - "output": 2.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "microsoft/Phi-4-multimodal-instruct", - "name": "Phi-4 15B", - "display_name": "Phi-4 15B", + "id": "microsoft/phi-3.5-vision-instruct", + "name": "Phi-3.5-vision instruct (128k)", + "display_name": "Phi-3.5-vision instruct (128k)", "modalities": { "input": [ "text", @@ -101372,58 +109052,63 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.24, - "output": 0.47 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "KBLab/kb-whisper-large", - "name": "KB Whisper", - "display_name": "KB Whisper", + "id": "microsoft/phi-3-small-8k-instruct", + "name": "Phi-3-small instruct (8k)", + "display_name": "Phi-3-small instruct (8k)", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 448, - "output": 448 + "context": 8192, + "output": 2048 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "nvidia/Llama-3.3-70B-Instruct-FP8", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "microsoft/phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE instruct (128k)", + "display_name": "Phi-3.5-MoE instruct (128k)", "modalities": { "input": [ "text" @@ -101433,58 +109118,63 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 1.18, - "output": 1.18 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/whisper-large-v3", - "name": "Whisper 3 Large", - "display_name": "Whisper 3 Large", + "id": "microsoft/phi-3.5-mini-instruct", + "name": "Phi-3.5-mini instruct (128k)", + "display_name": "Phi-3.5-mini instruct (128k)", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 448, + "context": 128000, "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "microsoft/mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ "text" @@ -101495,76 +109185,62 @@ }, "limit": { "context": 65536, - "output": 65536 + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.24, - "output": 0.94 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "microsoft/phi-3-mini-4k-instruct", + "name": "Phi-3-mini instruct (4k)", + "display_name": "Phi-3-mini instruct (4k)", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 4096, + "output": 1024 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1.47, - "output": 5.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "intfloat/multilingual-e5-large-instruct", - "name": "E5 Multi-Lingual Large Embeddings 0.6B", - "display_name": "E5 Multi-Lingual Large Embeddings 0.6B", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -101574,36 +109250,30 @@ ] }, "limit": { - "context": 512, - "output": 512 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.12, - "output": 0.12 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "synthetic": { - "id": "synthetic", - "name": "Synthetic", - "display_name": "Synthetic", - "api": "https://api.synthetic.new/openai/v1", - "doc": "https://synthetic.new/pricing", - "models": [ + }, { - "id": "hf:meta-llama/Llama-3.1-405B-Instruct", - "name": "Llama-3.1-405B-Instruct", - "display_name": "Llama-3.1-405B-Instruct", + "id": "microsoft/phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -101614,7 +109284,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -101624,52 +109294,54 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 3, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama-4-Scout-17B-16E-Instruct", - "display_name": "Llama-4-Scout-17B-16E-Instruct", + "id": "microsoft/phi-4-multimodal-instruct", + "name": "Phi-4-multimodal-instruct", + "display_name": "Phi-4-multimodal-instruct", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 328000, + "context": 128000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "mistral-ai/mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ "text" @@ -101689,20 +109361,53 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.9, - "output": 0.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "mistral-ai/codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "mistral-ai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -101713,7 +109418,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -101723,22 +109428,23 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-03", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama-3.1-70B-Instruct", - "display_name": "Llama-3.1-70B-Instruct", + "id": "mistral-ai/mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -101755,20 +109461,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.9, - "output": 0.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "mistral-ai/mistral-medium-2505", + "name": "Mistral Medium 3 (25.05)", + "display_name": "Mistral Medium 3 (25.05)", "modalities": { "input": [ "text", @@ -101779,29 +109485,30 @@ ] }, "limit": { - "context": 524000, - "output": 4096 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "mistral-ai/ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -101811,8 +109518,8 @@ ] }, "limit": { - "context": 196608, - "output": 131000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -101820,25 +109527,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -101848,8 +109551,8 @@ ] }, "limit": { - "context": 191488, - "output": 65536 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -101870,19 +109573,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-07", - "last_updated": "2026-02-07", + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -101892,8 +109595,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -101914,30 +109617,30 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-06", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-97B-A17B", - "display_name": "Qwen3.5-97B-A17B", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -101945,32 +109648,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2024-06", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen2.5-Coder-32B-Instruct", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -101980,29 +109672,30 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-11-11", - "last_updated": "2024-11-11", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 0.8, - "output": 0.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen 3 235B Instruct", - "display_name": "Qwen 3 235B Instruct", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -102012,29 +109705,30 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "meta/meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -102044,8 +109738,8 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -102053,32 +109747,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.65, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": "meta/meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -102088,32 +109771,34 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2, - "output": 2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -102121,7 +109806,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102130,22 +109815,24 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 (0324)", - "display_name": "DeepSeek V3 (0324)", + "id": "meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -102153,27 +109840,29 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 1.2, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "meta/meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -102183,8 +109872,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -102194,22 +109883,24 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 1.25, - "output": 1.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -102217,7 +109908,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102225,32 +109916,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 (0528)", - "display_name": "DeepSeek R1 (0528)", + "id": "meta/meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" @@ -102260,8 +109940,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -102269,42 +109949,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 3, - "output": 8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 162816, - "output": 8000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -102312,27 +109984,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.27, - "cache_write": 0 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "meta/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -102343,7 +110009,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -102352,19 +110018,20 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.2, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "hf:openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -102383,25 +110050,57 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0, + "output": 0 + }, + "type": "chat" + } + ] + }, + "qiniu-ai": { + "id": "qiniu-ai", + "name": "Qiniu", + "display_name": "Qiniu", + "api": "https://api.qnaigc.com/v1", + "doc": "https://developer.qiniu.com/aitokenapi", + "models": [ + { + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30b A3b Instruct 2507", + "display_name": "Qwen3 30b A3b Instruct 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-04", + "last_updated": "2026-02-04", "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -102411,14 +110110,13 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -102432,52 +110130,45 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-07", - "last_updated": "2025-11-07", - "cost": { - "input": 0.55, - "output": 2.19 - }, + "open_weights": false, + "release_date": "2025-09-06", + "last_updated": "2025-09-06", "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "doubao-seed-2.0-pro", + "name": "Doubao Seed 2.0 Pro", + "display_name": "Doubao Seed 2.0 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 1.2, - "output": 1.2 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "claude-3.7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", "modalities": { "input": [ "text", @@ -102488,41 +110179,105 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", - "cost": { - "input": 0.55, - "output": 2.19 + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "type": "chat" + }, + { + "id": "doubao-seed-2.0-code", + "name": "Doubao Seed 2.0 Code", + "display_name": "Doubao Seed 2.0 Code", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", + "type": "chat" + }, + { + "id": "qwen2.5-vl-72b-instruct", + "name": "Qwen 2.5 VL 72B Instruct", + "display_name": "Qwen 2.5 VL 72B Instruct", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "hf:nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-NVFP4", - "name": "Nemotron 3 Super 120B", - "display_name": "Nemotron 3 Super 120B", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -102532,8 +110287,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -102553,32 +110308,28 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-03-11", - "last_updated": "2026-04-03", - "cost": { - "input": 0.3, - "output": 1, - "cache_read": 0.3 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "hf:nvidia/Kimi-K2.5-NVFP4", - "name": "Kimi K2.5 (NVFP4)", - "display_name": "Kimi K2.5 (NVFP4)", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -102590,29 +110341,32 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", - "cost": { - "input": 0.55, - "output": 2.19 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "hf:zai-org/GLM-4.7-Flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -102622,8 +110376,8 @@ ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -102643,20 +110397,15 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-18", - "last_updated": "2026-01-18", - "cost": { - "input": 0.06, - "output": 0.4, - "cache_read": 0.06 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "hf:zai-org/GLM-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -102666,52 +110415,37 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0.55, - "output": 2.19 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "hf:zai-org/GLM-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "doubao-seed-2.0-mini", + "name": "Doubao Seed 2.0 Mini", + "display_name": "Doubao Seed 2.0 Mini", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -102719,43 +110453,28 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-12", - "cost": { - "input": 1, - "output": 3, - "cache_read": 1 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "hf:zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "claude-3.5-sonnet", + "name": "Claude 3.5 Sonnet", + "display_name": "Claude 3.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 200000, + "output": 8200 }, "temperature": true, "tool_call": true, @@ -102763,35 +110482,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-04-08", - "cost": { - "input": 1, - "output": 3, - "cache_read": 1 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-09", + "last_updated": "2025-09-09", "type": "chat" }, { - "id": "hf:zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "claude-4.0-sonnet", + "name": "Claude 4.0 Sonnet", + "display_name": "Claude 4.0 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -102807,38 +110511,29 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.55, - "output": 2.19 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "doubao-seed-1.6-thinking", + "name": "Doubao-Seed 1.6 Thinking", + "display_name": "Doubao-Seed 1.6 Thinking", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -102846,42 +110541,16 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.95 - }, + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" - } - ] - }, - "nvidia": { - "id": "nvidia", - "name": "Nvidia", - "display_name": "Nvidia", - "api": "https://integrate.api.nvidia.com/v1", - "doc": "https://docs.api.nvidia.com/nim/", - "models": [ + }, { - "id": "upstage/solar-10_7b-instruct", - "name": "solar-10.7b-instruct", - "display_name": "solar-10.7b-instruct", + "id": "deepseek-v3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ "text" @@ -102892,188 +110561,196 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-06-05", - "last_updated": "2025-04-10", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "type": "chat" }, { - "id": "black-forest-labs/flux_2-klein-4b", - "name": "FLUX.2 Klein 4B", - "display_name": "FLUX.2 Klein 4B", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "image", "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-01-14", - "last_updated": "2026-01-31", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "type": "chat" }, { - "id": "black-forest-labs/flux.1-dev", - "name": "FLUX.1-dev", - "display_name": "FLUX.1-dev", + "id": "glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 4096, - "output": 8192 + "context": 131000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "black-forest-labs/flux_1-schnell", - "name": "FLUX.1-schnell", - "display_name": "FLUX.1-schnell", + "id": "qwen3-235b-a22b", + "name": "Qwen 3 235B A22B", + "display_name": "Qwen 3 235B A22B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 77, - "output": 8192 + "context": 128000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-08-01", - "last_updated": "2026-02-04", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "black-forest-labs/flux_1-kontext-dev", - "name": "FLUX.1-Kontext-dev", - "display_name": "FLUX.1-Kontext-dev", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 256000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-22", + "last_updated": "2026-02-22", "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "doubao-1.5-vision-pro", + "name": "Doubao 1.5 Vision Pro", + "display_name": "Doubao 1.5 Vision Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", - "cost": { - "input": 0, - "output": 0 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mistral-large-3-675b-instruct-2512", - "name": "Mistral Large 3 675B Instruct 2512", - "display_name": "Mistral Large 3 675B Instruct 2512", + "id": "claude-4.5-haiku", + "name": "Claude 4.5 Haiku", + "display_name": "Claude 4.5 Haiku", "modalities": { "input": [ "text", @@ -103084,29 +110761,25 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "type": "chat" }, { - "id": "mistralai/devstral-2-123b-instruct-2512", - "name": "Devstral-2-123B-Instruct-2512", - "display_name": "Devstral-2-123B-Instruct-2512", + "id": "qwen-max-2025-01-25", + "name": "Qwen2.5-Max-2025-01-25", + "display_name": "Qwen2.5-Max-2025-01-25", "modalities": { "input": [ "text" @@ -103116,30 +110789,24 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-08", - "last_updated": "2025-12-09", - "cost": { - "input": 0, - "output": 0 + "supported": false }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mistral-nemotron", - "name": "mistral-nemotron", - "display_name": "mistral-nemotron", + "id": "doubao-1.5-thinking-pro", + "name": "Doubao 1.5 Thinking Pro", + "display_name": "Doubao 1.5 Thinking Pro", "modalities": { "input": [ "text" @@ -103150,27 +110817,24 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-12", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mixtral-8x22b-instruct", - "name": "Mistral: Mixtral 8x22B Instruct", - "display_name": "Mistral: Mixtral 8x22B Instruct", + "id": "glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -103180,59 +110844,55 @@ ] }, "limit": { - "context": 65536, - "output": 13108 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2024-04-17", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mistral-medium-3-instruct", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "qwen2.5-vl-7b-instruct", + "name": "Qwen 2.5 VL 7B Instruct", + "display_name": "Qwen 2.5 VL 7B Instruct", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mixtral-8x7b-instruct", - "name": "Mistral: Mixtral 8x7B Instruct", - "display_name": "Mistral: Mixtral 8x7B Instruct", + "id": "qwen-turbo", + "name": "Qwen-Turbo", + "display_name": "Qwen-Turbo", "modalities": { "input": [ "text" @@ -103242,28 +110902,36 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1000000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-12-10", - "last_updated": "2026-03-15", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/magistral-small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -103273,191 +110941,201 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct-v03", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "claude-4.0-opus", + "name": "Claude 4.0 Opus", + "display_name": "Claude 4.0 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistralai/mistral-small-4-119b-2603", - "name": "mistral-small-4-119b-2603", - "display_name": "mistral-small-4-119b-2603", + "id": "claude-4.5-sonnet", + "name": "Claude 4.5 Sonnet", + "display_name": "Claude 4.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "type": "chat" }, { - "id": "sarvamai/sarvam-m", - "name": "sarvam-m", - "display_name": "sarvam-m", + "id": "claude-4.5-opus", + "name": "Claude 4.5 Opus", + "display_name": "Claude 4.5 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-Mini", - "display_name": "Phi-4-Mini", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", "image", - "audio" + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Phi 4 Multimodal", - "display_name": "Phi 4 Multimodal", + "id": "claude-4.1-opus", + "name": "Claude 4.1 Opus", + "display_name": "Claude 4.1 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning", - "name": "Nemotron 3 Nano Omni", - "display_name": "Nemotron 3 Nano Omni", + "id": "doubao-seed-1.6", + "name": "Doubao-Seed 1.6", + "display_name": "Doubao-Seed 1.6", "modalities": { "input": [ "text", "image", - "video", - "audio" + "video" ], "output": [ "text" @@ -103465,7 +111143,7 @@ }, "limit": { "context": 256000, - "output": 65536 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -103474,19 +111152,15 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-28", - "last_updated": "2026-04-28", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" }, { - "id": "nvidia/usdvalidate", - "name": "usdvalidate", - "display_name": "usdvalidate", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30b A3b Thinking 2507", + "display_name": "Qwen3 30b A3b Thinking 2507", "modalities": { "input": [ "text" @@ -103496,165 +111170,188 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 126000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2025-01-08", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-04", + "last_updated": "2026-02-04", "type": "chat" }, { - "id": "nvidia/synthetic-video-detector", - "name": "synthetic-video-detector", - "display_name": "synthetic-video-detector", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, + "context": 40000, "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/cosmos-transfer1-7b", - "name": "cosmos-transfer1-7b", - "display_name": "cosmos-transfer1-7b", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 131072, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-06-13", - "last_updated": "2025-06-30", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "type": "chat" }, { - "id": "nvidia/rerank-qa-mistral-4b", - "name": "rerank-qa-mistral-4b", - "display_name": "rerank-qa-mistral-4b", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-17", - "last_updated": "2025-01-17", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/nv-embedcode-7b-v1", - "name": "nv-embedcode-7b-v1", - "display_name": "nv-embedcode-7b-v1", + "id": "qwen-vl-max-2025-01-25", + "name": "Qwen VL-MAX-2025-01-25", + "display_name": "Qwen VL-MAX-2025-01-25", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-17", - "last_updated": "2025-05-29", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super", - "display_name": "Nemotron 3 Super", + "id": "doubao-seed-2.0-lite", + "name": "Doubao Seed 2.0 Lite", + "display_name": "Doubao Seed 2.0 Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -103662,21 +111359,16 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", - "cost": { - "input": 0.2, - "output": 0.8 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "nvidia/riva-translate-4b-instruct-v1_1", - "name": "riva-translate-4b-instruct-v1_1", - "display_name": "riva-translate-4b-instruct-v1_1", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -103686,32 +111378,41 @@ ] }, "limit": { - "context": 128000, + "context": 40000, "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/nemotron-voicechat", - "name": "nemotron-voicechat", - "display_name": "nemotron-voicechat", + "id": "qwen3-vl-30b-a3b-thinking", + "name": "Qwen3-Vl 30b A3b Thinking", + "display_name": "Qwen3-Vl 30b A3b Thinking", "modalities": { "input": [ "text", - "audio" + "image", + "video" ], "output": [ "text" @@ -103719,27 +111420,34 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-09", + "last_updated": "2026-02-09", "type": "chat" }, { - "id": "nvidia/llama-3_3-nemotron-super-49b-v1_5", - "name": "Llama 3.3 Nemotron Super 49B v1.5", - "display_name": "Llama 3.3 Nemotron Super 49B v1.5", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -103749,8 +111457,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -103759,82 +111467,91 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "type": "chat" }, { - "id": "nvidia/usdcode", - "name": "usdcode", - "display_name": "usdcode", + "id": "gemini-3.0-pro-image-preview", + "name": "Gemini 3.0 Pro Image Preview", + "display_name": "Gemini 3.0 Pro Image Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "type": "chat" }, { - "id": "nvidia/llama-3_2-nemoretriever-300m-embed-v1", - "name": "llama-3_2-nemoretriever-300m-embed-v1", - "display_name": "llama-3_2-nemoretriever-300m-embed-v1", + "id": "kling-v2-6", + "name": "Kling-V2 6", + "display_name": "Kling-V2 6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 99999999, + "output": 99999999 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-24", - "last_updated": "2025-07-24", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-13", + "last_updated": "2026-01-13", "type": "chat" }, { - "id": "nvidia/llama-3_1-nemotron-safety-guard-8b-v3", - "name": "llama-3.1-nemotron-safety-guard-8b-v3", - "display_name": "llama-3.1-nemotron-safety-guard-8b-v3", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235b A22B Instruct 2507", + "display_name": "Qwen3 235b A22B Instruct 2507", "modalities": { "input": [ "text" @@ -103844,28 +111561,24 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "type": "chat" }, { - "id": "nvidia/nv-embed-v1", - "name": "nv-embed-v1", - "display_name": "nv-embed-v1", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -103875,39 +111588,39 @@ ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 262000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-06-07", - "last_updated": "2025-07-22", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-14", + "last_updated": "2025-08-14", "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "nemotron-3-nano-30b-a3b", - "display_name": "nemotron-3-nano-30b-a3b", + "id": "gemini-3.0-pro-preview", + "name": "Gemini 3.0 Pro Preview", + "display_name": "Gemini 3.0 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "pdf", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -103915,21 +111628,33 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-12", - "last_updated": "2024-12", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": "nvidia/gliner-pii", - "name": "gliner-pii", - "display_name": "gliner-pii", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -103939,59 +111664,36 @@ ] }, "limit": { - "context": 128000, + "context": 262144, "output": 4096 }, "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "nvidia/bevformer", - "name": "bevformer", - "display_name": "bevformer", - "modalities": { - "input": [ - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": "2025-07-20", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "type": "chat" }, { - "id": "nvidia/nemotron-mini-4b-instruct", - "name": "nemotron-mini-4b-instruct", - "display_name": "nemotron-mini-4b-instruct", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -104002,7 +111704,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -104010,19 +111712,15 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-08-21", - "last_updated": "2024-08-26", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/cosmos-predict1-5b", - "name": "cosmos-predict1-5b", - "display_name": "cosmos-predict1-5b", + "id": "doubao-seed-1.6-flash", + "name": "Doubao-Seed 1.6 Flash", + "display_name": "Doubao-Seed 1.6 Flash", "modalities": { "input": [ "text", @@ -104030,32 +111728,29 @@ "video" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 256000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": "2025-03-18", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" }, { - "id": "nvidia/llama-3_3-nemotron-super-49b-v1", - "name": "Llama 3.3 Nemotron Super 49B v1", - "display_name": "Llama 3.3 Nemotron Super 49B v1", + "id": "MiniMax-M1", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ "text" @@ -104065,8 +111760,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 80000 }, "temperature": true, "tool_call": true, @@ -104075,31 +111770,29 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-07", - "last_updated": "2025-04-07", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/nvidia-nemotron-nano-9b-v2", - "name": "nvidia-nemotron-nano-9b-v2", - "display_name": "nvidia-nemotron-nano-9b-v2", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -104107,54 +111800,64 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2025-08-18", - "last_updated": "2025-08-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/cosmos-transfer2_5-2b", - "name": "cosmos-transfer2.5-2b", - "display_name": "cosmos-transfer2.5-2b", + "id": "gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "display_name": "Gemini 2.5 Flash Image", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ - "video" + "image" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 32768, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "open_weights": false, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", + "type": "imageGeneration" }, { - "id": "nvidia/nemotron-content-safety-reasoning-4b", - "name": "nemotron-content-safety-reasoning-4b", - "display_name": "nemotron-content-safety-reasoning-4b", + "id": "doubao-1.5-pro-32k", + "name": "Doubao 1.5 Pro 32k", + "display_name": "Doubao 1.5 Pro 32k", "modalities": { "input": [ "text" @@ -104165,94 +111868,81 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 12000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-22", - "last_updated": "2026-01-22", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/active-speaker-detection", - "name": "Active Speaker Detection", - "display_name": "Active Speaker Detection", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 131072, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "type": "chat" }, { - "id": "nvidia/magpie-tts-zeroshot", - "name": "magpie-tts-zeroshot", - "display_name": "magpie-tts-zeroshot", + "id": "claude-3.5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text", - "audio" + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-05-22", - "last_updated": "2025-06-12", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "type": "chat" }, { - "id": "nvidia/streampetr", - "name": "streampetr", - "display_name": "streampetr", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "video" + "text" ], "output": [ "text" @@ -104260,29 +111950,34 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "nvidia/sparsedrive", - "name": "sparsedrive", - "display_name": "sparsedrive", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ + "text", + "image", + "audio", "video" ], "output": [ @@ -104290,91 +111985,115 @@ ] }, "limit": { - "context": 128000, + "context": 1048576, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": "2025-07-20", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "nvidia/nemotron-3-content-safety", - "name": "nemotron-3-content-safety", - "display_name": "nemotron-3-content-safety", + "id": "gemini-3.0-flash-preview", + "name": "Gemini 3.0 Flash Preview", + "display_name": "Gemini 3.0 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "type": "chat" }, { - "id": "nvidia/llama-nemotron-embed-vl-1b-v2", - "name": "llama-nemotron-embed-vl-1b-v2", - "display_name": "llama-nemotron-embed-vl-1b-v2", + "id": "moonshotai/kimi-k2.5", + "name": "Moonshotai/Kimi-K2.5", + "display_name": "Moonshotai/Kimi-K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 256000, + "output": 256000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-10", - "last_updated": "2026-02-10", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "type": "chat" }, { - "id": "nvidia/studiovoice", - "name": "studiovoice", - "display_name": "studiovoice", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -104384,98 +112103,90 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 100000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-10-03", - "last_updated": "2025-06-13", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "type": "chat" }, { - "id": "nvidia/llama-nemotron-rerank-vl-1b-v2", - "name": "llama-nemotron-rerank-vl-1b-v2", - "display_name": "llama-nemotron-rerank-vl-1b-v2", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 100000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-31", - "last_updated": "2026-03-31", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "z-ai/autoglm-phone-9b", + "name": "Z-Ai/Autoglm Phone 9b", + "display_name": "Z-Ai/Autoglm Phone 9b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 12800, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "z-ai/glm-4.6", + "name": "Z-AI/GLM 4.6", + "display_name": "Z-AI/GLM 4.6", "modalities": { "input": [ "text" @@ -104485,62 +112196,68 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "type": "chat" }, { - "id": "openai/whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "z-ai/glm-4.7", + "name": "Z-Ai/GLM 4.7", + "display_name": "Z-Ai/GLM 4.7", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 200000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "z-ai/glm-5", + "name": "Z-Ai/GLM 5", + "display_name": "Z-Ai/GLM 5", "modalities": { "input": [ "text" @@ -104550,8 +112267,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -104561,61 +112278,76 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "openai/gpt-5.2", + "name": "OpenAI/GPT-5.2", + "display_name": "OpenAI/GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-04", - "last_updated": "2025-08-14", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "type": "chat" }, { - "id": "minimaxai/minimax-m2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "openai/gpt-5", + "name": "OpenAI/GPT-5", + "display_name": "OpenAI/GPT-5", "modalities": { "input": [ "text" @@ -104625,8 +112357,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -104637,28 +112369,34 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-04-11", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "type": "chat" }, { - "id": "minimaxai/minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "minimax/minimax-m2.1", + "name": "Minimax/Minimax-M2.1", + "display_name": "Minimax/Minimax-M2.1", "modalities": { "input": [ "text" @@ -104669,7 +112407,7 @@ }, "limit": { "context": 204800, - "output": 131072 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -104683,20 +112421,15 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "z-ai/glm4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "minimax/minimax-m2", + "name": "Minimax/Minimax-M2", + "display_name": "Minimax/Minimax-M2", "modalities": { "input": [ "text" @@ -104706,8 +112439,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -104717,30 +112450,19 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "type": "chat" }, { - "id": "z-ai/glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "minimax/minimax-m2.5", + "name": "Minimax/Minimax-M2.5", + "display_name": "Minimax/Minimax-M2.5", "modalities": { "input": [ "text" @@ -104750,8 +112472,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -104761,29 +112483,19 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "meta/esm2-650m", - "name": "esm2-650m", - "display_name": "esm2-650m", + "id": "minimax/minimax-m2.5-highspeed", + "name": "Minimax/Minimax-M2.5 Highspeed", + "display_name": "Minimax/Minimax-M2.5 Highspeed", "modalities": { "input": [ "text" @@ -104793,28 +112505,30 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-29", - "last_updated": "2025-03-10", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama 3.3 70b Instruct", - "display_name": "Llama 3.3 70b Instruct", + "id": "x-ai/grok-code-fast-1", + "name": "x-AI/Grok-Code-Fast 1", + "display_name": "x-AI/Grok-Code-Fast 1", "modalities": { "input": [ "text" @@ -104824,224 +112538,221 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-26", - "last_updated": "2024-11-26", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-02", + "last_updated": "2025-09-02", "type": "chat" }, { - "id": "meta/esmfold", - "name": "esmfold", - "display_name": "esmfold", + "id": "x-ai/grok-4.1-fast-reasoning", + "name": "X-Ai/Grok 4.1 Fast Reasoning", + "display_name": "X-Ai/Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 20000000, + "output": 2000000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-15", - "last_updated": "2025-06-12", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "type": "chat" }, { - "id": "meta/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "x-ai/grok-4.1-fast-non-reasoning", + "name": "X-Ai/Grok 4.1 Fast Non Reasoning", + "display_name": "X-Ai/Grok 4.1 Fast Non Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11b Vision Instruct", - "display_name": "Llama 3.2 11b Vision Instruct", + "id": "x-ai/grok-4-fast", + "name": "x-AI/Grok-4-Fast", + "display_name": "x-AI/Grok-4-Fast", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-20", + "last_updated": "2025-09-20", "type": "chat" }, { - "id": "meta/llama-guard-4-12b", - "name": "Llama Guard 4 12B", - "display_name": "Llama Guard 4 12B", + "id": "x-ai/grok-4.1-fast", + "name": "x-AI/Grok-4.1-Fast", + "display_name": "x-AI/Grok-4.1-Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2026-04-30", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "type": "chat" }, { - "id": "meta/llama-3.1-70b-instruct", - "name": "Llama 3.1 70b Instruct", - "display_name": "Llama 3.1 70b Instruct", + "id": "x-ai/grok-4-fast-non-reasoning", + "name": "X-Ai/Grok-4-Fast-Non-Reasoning", + "display_name": "X-Ai/Grok-4-Fast-Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "type": "chat" }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1b Instruct", - "display_name": "Llama 3.2 1b Instruct", + "id": "x-ai/grok-4-fast-reasoning", + "name": "X-Ai/Grok-4-Fast-Reasoning", + "display_name": "X-Ai/Grok-4-Fast-Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "type": "chat" }, { - "id": "meta/llama-4-maverick-17b-128e-instruct", - "name": "Llama 4 Maverick 17b 128e Instruct", - "display_name": "Llama 4 Maverick 17b 128e Instruct", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek/DeepSeek-V3.2-Exp", + "display_name": "DeepSeek/DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -105049,28 +112760,23 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-02", - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "type": "chat" }, { - "id": "meta/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "deepseek/deepseek-v3.1-terminus-thinking", + "name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", + "display_name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", "modalities": { "input": [ "text" @@ -105080,28 +112786,25 @@ ] }, "limit": { - "context": 32768, + "context": 128000, "output": 32000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "type": "chat" }, { - "id": "meta/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "deepseek/deepseek-math-v2", + "name": "Deepseek/Deepseek-Math-V2", + "display_name": "Deepseek/Deepseek-Math-V2", "modalities": { "input": [ "text" @@ -105111,107 +112814,81 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 160000, + "output": 160000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "type": "chat" }, { - "id": "qwen/qwen-image-edit", - "name": "Qwen Image Edit", - "display_name": "Qwen Image Edit", + "id": "deepseek/deepseek-v3.2-251201", + "name": "Deepseek/DeepSeek-V3.2", + "display_name": "Deepseek/DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", - "cost": { - "input": 0, - "output": 0 - }, - "type": "imageGeneration" + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "type": "chat" }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5 122B-A10B", - "display_name": "Qwen3.5 122B-A10B", + "id": "deepseek/deepseek-v3.2-exp-thinking", + "name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", + "display_name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "type": "chat" }, { - "id": "qwen/qwen2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32b Instruct", - "display_name": "Qwen2.5 Coder 32b Instruct", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek/DeepSeek-V3.1-Terminus", + "display_name": "DeepSeek/DeepSeek-V3.1-Terminus", "modalities": { "input": [ "text" @@ -105222,7 +112899,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -105230,19 +112907,15 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-06", - "last_updated": "2024-11-06", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "stepfun/step-3.5-flash", + "name": "Stepfun/Step-3.5 Flash", + "display_name": "Stepfun/Step-3.5 Flash", "modalities": { "input": [ "text", @@ -105253,41 +112926,24 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 64000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "meituan/longcat-flash-chat", + "name": "Meituan/Longcat-Flash-Chat", + "display_name": "Meituan/Longcat-Flash-Chat", "modalities": { "input": [ "text" @@ -105297,41 +112953,24 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-11-05", + "last_updated": "2025-11-05", "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen3-Next-80B-A3B-Instruct", + "id": "meituan/longcat-flash-lite", + "name": "Meituan/Longcat-Flash-Lite", + "display_name": "Meituan/Longcat-Flash-Lite", "modalities": { "input": [ "text" @@ -105341,8 +112980,8 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 256000, + "output": 320000 }, "temperature": true, "tool_call": true, @@ -105351,51 +112990,42 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "type": "chat" }, { - "id": "qwen/qwen-image", - "name": "Qwen Image", - "display_name": "Qwen Image", + "id": "stepfun-ai/gelab-zero-4b-preview", + "name": "Stepfun-Ai/Gelab Zero 4b Preview", + "display_name": "Stepfun-Ai/Gelab Zero 4b Preview", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { "context": 8192, - "output": 8192 + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0, - "output": 0 - }, - "type": "imageGeneration" + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "type": "chat" }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "mimo-v2-flash", + "name": "Mimo-V2-Flash", + "display_name": "Mimo-V2-Flash", "modalities": { "input": [ "text" @@ -105405,29 +113035,31 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "google/gemma-2-2b-it", - "name": "Gemma 2 2b It", - "display_name": "Gemma 2 2b It", + "id": "xiaomi/mimo-v2-flash", + "name": "Xiaomi/Mimo-V2-Flash", + "display_name": "Xiaomi/Mimo-V2-Flash", "modalities": { "input": [ "text" @@ -105437,66 +113069,82 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" - }, + } + ] + }, + "google": { + "id": "google", + "name": "google", + "display_name": "google", + "doc": "https://ai.google.dev/gemini-api/docs/models", + "models": [ { - "id": "google/gemma-3n-e4b-it", - "name": "Gemma 3n E4b It", - "display_name": "Gemma 3n E4b It", + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-06-03", - "last_updated": "2025-06-03", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma-4-31B-IT", - "display_name": "Gemma-4-31B-IT", + "id": "gemma-4-26b-a4b-it", + "name": "Gemma 4 26B", + "display_name": "Gemma 4 26B", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" @@ -105504,7 +113152,7 @@ }, "limit": { "context": 256000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -105512,33 +113160,30 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", "release_date": "2026-04-02", "last_updated": "2026-04-02", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "google/gemma-3n-e2b-it", - "name": "Gemma 3n E2b It", - "display_name": "Gemma 3n E2b It", + "id": "gemini-1.5-flash", + "name": "Gemini 1.5 Flash", + "display_name": "Gemini 1.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -105546,32 +113191,36 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-06-12", - "last_updated": "2025-06-12", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", "cost": { - "input": 0, - "output": 0 + "input": 0.075, + "output": 0.3, + "cache_read": 0.01875 }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma-3-27B-IT", - "display_name": "Gemma-3-27B-IT", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -105579,21 +113228,28 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "google/google-paligemma", - "name": "paligemma", - "display_name": "paligemma", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09 2025", + "display_name": "Gemini 2.5 Flash Preview 09 2025", "modalities": { "input": [ "text", @@ -105604,74 +113260,155 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "search": { + "supported": true, + "default": false }, "attachment": true, - "open_weights": true, - "release_date": "2024-05-14", - "last_updated": "2024-08-26", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 128, + "max": 32768 + } }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-01-01", - "last_updated": "2025-09-05", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "display_name": "Gemini 2.5 Flash Preview 04-17", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -105682,51 +113419,62 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, + "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { "input": 0, "output": 0 @@ -105734,20 +113482,21 @@ "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gemma-4-31b-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -105755,180 +113504,212 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11", - "last_updated": "2025-12", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "type": "chat" }, { - "id": "abacusai/dracarys-llama-3_1-70b-instruct", - "name": "dracarys-llama-3.1-70b-instruct", - "display_name": "dracarys-llama-3.1-70b-instruct", + "id": "gemini-2.5-pro-preview-tts", + "name": "Gemini 2.5 Pro Preview TTS", + "display_name": "Gemini 2.5 Pro Preview TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-11", - "last_updated": "2025-05-22", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 20 }, "type": "chat" }, { - "id": "baai/bge-m3", - "name": "BGE M3", - "display_name": "BGE M3", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "display_name": "Gemini 2.5 Flash Preview 05-20", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-01-30", - "last_updated": "2026-04-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 }, - "type": "embedding" + "type": "chat" }, { - "id": "bytedance/seed-oss-36b-instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "gemini-3.1-flash-image-preview", + "name": "Gemini 3.1 Flash Image (Preview)", + "display_name": "Gemini 3.1 Flash Image (Preview)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "knowledge": "2025-01", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 60 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "deepseek-ai/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "gemini-live-2.5-flash-preview-native-audio", + "name": "Gemini Live 2.5 Flash Preview Native Audio", + "display_name": "Gemini Live 2.5 Flash Preview Native Audio", "modalities": { "input": [ - "text" + "text", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 131072, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-09-18", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.5, + "output": 2, + "input_audio": 3, + "output_audio": 12 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "display_name": "Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" @@ -105936,7 +113717,7 @@ }, "limit": { "context": 1048576, - "output": 393216 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -105947,39 +113728,38 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" - } - ] - }, - "inference": { - "id": "inference", - "name": "Inference", - "display_name": "Inference", - "api": "https://inference.net/v1", - "doc": "https://inference.net/models", - "models": [ + }, { - "id": "mistral/mistral-nemo-12b-instruct", - "name": "Mistral Nemo 12B Instruct", - "display_name": "Mistral Nemo 12B Instruct", + "id": "gemma-3n-e2b-it", + "name": "Gemma 3n 2B", + "display_name": "Gemma 3n 2B", "modalities": { "input": [ "text" @@ -105989,223 +113769,354 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 8192, + "output": 2000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.038, - "output": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11B Vision Instruct", - "display_name": "Llama 3.2 11B Vision Instruct", + "id": "gemma-3n-e4b-it", + "name": "Gemma 3n 4B", + "display_name": "Gemma 3n 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 8192, + "output": 2000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-10", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.055, - "output": 0.055 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "display_name": "Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", "cost": { - "input": 0.01, - "output": 0.01 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "meta/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09 2025", + "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "meta/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.025, - "output": 0.025 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-7b-vision-instruct", - "name": "Qwen 2.5 7B Vision Instruct", - "display_name": "Qwen 2.5 7B Vision Instruct", + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen/qwen3-embedding-4b", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 2048 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.01, - "output": 0 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, - "type": "embedding" + "type": "chat" }, { - "id": "google/gemma-3", - "name": "Google Gemma 3", - "display_name": "Google Gemma 3", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", @@ -106216,159 +114127,187 @@ ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "search": { + "supported": false + }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.15, + "input": 0.075, "output": 0.3 }, "type": "chat" }, { - "id": "osmosis/osmosis-structure-0.6b", - "name": "Osmosis Structure 0.6B", - "display_name": "Osmosis Structure 0.6B", + "id": "gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 2048 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.1, - "output": 0.5 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" - } - ] - }, - "inception": { - "id": "inception", - "name": "Inception", - "display_name": "Inception", - "api": "https://api.inceptionlabs.ai/v1/", - "doc": "https://platform.inceptionlabs.ai/docs", - "models": [ + }, { - "id": "mercury-edit-2", - "name": "Mercury Edit 2", - "display_name": "Mercury Edit 2", + "id": "gemini-2.5-flash-image-preview", + "name": "Gemini 2.5 Flash Image Preview", + "display_name": "Gemini 2.5 Flash Image Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 0.3, + "output": 30, + "cache_read": 0.075 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": "gemini-2.5-flash-preview-tts", + "name": "Gemini 2.5 Flash Preview TTS", + "display_name": "Gemini 2.5 Flash Preview TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 128000, - "output": 50000 + "context": 8000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 0.5, + "output": 10 }, "type": "chat" - } - ] - }, - "openai": { - "id": "openai", - "name": "OpenAI", - "display_name": "OpenAI", - "doc": "https://platform.openai.com/docs/models", - "models": [ + }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "display_name": "Gemini 2.5 Flash Lite Preview 06-17", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -106378,86 +114317,100 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "gpt-4o-2024-05-13", - "name": "GPT-4o (2024-05-13)", - "display_name": "GPT-4o (2024-05-13)", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 5, - "output": 15 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1048576, "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -106466,46 +114419,68 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -106515,165 +114490,110 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 21, - "output": 168 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8191, - "output": 3072 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "cost": { - "input": 0.13, - "output": 0 - }, - "type": "embedding" - }, - { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat (latest)", - "display_name": "GPT-5.3 Chat (latest)", + "id": "gemini-live-2.5-flash", + "name": "Gemini Live 2.5 Flash", + "display_name": "Gemini Live 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { "context": 128000, - "output": 16384 + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2025-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.5, + "output": 2, + "input_audio": 3, + "output_audio": 12 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "gemma-3-12b-it", + "name": "Gemma 3 12B", + "display_name": "Gemma 3 12B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", @@ -106684,177 +114604,149 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } }, "extra_capabilities": { "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, + "search": { + "supported": true, + "default": false + }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "display_name": "Gemini 2.5 Flash Image", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.3, + "output": 30, + "cache_read": 0.075 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "search": { + "supported": true, + "default": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "gemini-1.5-pro", + "name": "Gemini 1.5 Pro", + "display_name": "Gemini 1.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -106863,19 +114755,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-04", + "release_date": "2024-02-15", + "last_updated": "2024-02-15", "cost": { - "input": 10, - "output": 30 + "input": 1.25, + "output": 5, + "cache_read": 0.3125 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -106885,8 +114778,8 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 2048, + "output": 3072 }, "temperature": false, "tool_call": false, @@ -106895,19 +114788,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2022-12", - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.1, + "input": 0.15, "output": 0 }, "type": "embedding" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "gemma-3-4b-it", + "name": "Gemma 3 4B", + "display_name": "Gemma 3 4B", "modalities": { "input": [ "text", @@ -106918,140 +114811,107 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "gemini-1.5-flash-8b", + "name": "Gemini 1.5 Flash-8B", + "display_name": "Gemini 1.5 Flash-8B", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "knowledge": "2024-04", + "release_date": "2024-10-03", + "last_updated": "2024-10-03", "cost": { - "input": 20, - "output": 80 + "input": 0.0375, + "output": 0.15, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "gemini-2.0-flash-preview-image-generation", + "name": "Gemini 2.0 Flash Preview Image Generation", + "display_name": "Gemini 2.0 Flash Preview Image Generation", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "search": { + "supported": false }, + "attachment": true, "type": "chat" - }, + } + ] + }, + "sap-ai-core": { + "id": "sap-ai-core", + "name": "SAP AI Core", + "display_name": "SAP AI Core", + "doc": "https://help.sap.com/docs/sap-ai-core", + "models": [ { - "id": "o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "anthropic--claude-3-opus", + "name": "anthropic--claude-3-opus", + "display_name": "anthropic--claude-3-opus", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -107059,105 +114919,92 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "anthropic--claude-4.5-haiku", + "name": "anthropic--claude-4.5-haiku", + "display_name": "anthropic--claude-4.5-haiku", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -107165,129 +115012,99 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "sonar", + "name": "sonar", + "display_name": "sonar", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "gpt-image-1", - "name": "gpt-image-1", - "display_name": "gpt-image-1", + "id": "anthropic--claude-3-sonnet", + "name": "anthropic--claude-3-sonnet", + "display_name": "anthropic--claude-3-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", - "type": "imageGeneration" + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "anthropic--claude-3-haiku", + "name": "anthropic--claude-3-haiku", + "display_name": "anthropic--claude-3-haiku", "modalities": { "input": [ "text", @@ -107299,314 +115116,251 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "anthropic--claude-3.5-sonnet", + "name": "anthropic--claude-3.5-sonnet", + "display_name": "anthropic--claude-3.5-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "anthropic--claude-4.6-sonnet", + "name": "anthropic--claude-4.6-sonnet", + "display_name": "anthropic--claude-4.6-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "anthropic--claude-4.5-sonnet", + "name": "anthropic--claude-4.5-sonnet", + "display_name": "anthropic--claude-4.5-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gpt-image-1-mini", - "name": "gpt-image-1-mini", - "display_name": "gpt-image-1-mini", + "id": "sonar-deep-research", + "name": "sonar-deep-research", + "display_name": "sonar-deep-research", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2025-09-26", - "type": "imageGeneration" + "knowledge": "2025-01", + "release_date": "2025-02-01", + "last_updated": "2025-09-01", + "cost": { + "input": 2, + "output": 8, + "reasoning": 3 + }, + "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "gemini-2.5-flash-lite", + "name": "gemini-2.5-flash-lite", + "display_name": "gemini-2.5-flash-lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -107614,45 +115368,51 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", "modalities": { "input": [ "text", @@ -107663,7 +115423,7 @@ ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -107677,11 +115437,12 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ + "minimal", + "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -107694,82 +115455,55 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", - "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 - } - }, - "type": "chat" - }, - { - "id": "gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16385, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "gpt-5.4", + "name": "gpt-5.4", + "display_name": "gpt-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -107779,104 +115513,62 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "knowledge": "2025-08-31", + "release_date": "2026-04-27", + "last_updated": "2026-04-27", "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "anthropic--claude-4.6-opus", + "name": "anthropic--claude-4.6-opus", + "display_name": "anthropic--claude-4.6-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8191, - "output": 1536 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "cost": { - "input": 0.02, - "output": 0 - }, - "type": "embedding" - }, - { - "id": "o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "anthropic--claude-3.7-sonnet", + "name": "anthropic--claude-3.7-sonnet", + "display_name": "anthropic--claude-3.7-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -107884,75 +115576,110 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic uses thinking budget tokens" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "knowledge": "2024-10-31", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 150, - "output": 600 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-06-05", "cost": { - "input": 30, - "output": 60 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ "text", @@ -107993,22 +115720,22 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "anthropic--claude-4-sonnet", + "name": "anthropic--claude-4-sonnet", + "display_name": "anthropic--claude-4-sonnet", "modalities": { "input": [ "text", @@ -108020,72 +115747,47 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2.5, + "input": 3, "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "anthropic--claude-4.5-opus", + "name": "anthropic--claude-4.5-opus", + "display_name": "anthropic--claude-4.5-opus", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -108093,153 +115795,140 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-05", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gpt-5.3-codex-spark", - "name": "GPT-5.3 Codex Spark", - "display_name": "GPT-5.3 Codex Spark", + "id": "sonar-pro", + "name": "sonar-pro", + "display_name": "sonar-pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 200000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "chatgpt-image-latest", - "name": "chatgpt-image-latest", - "display_name": "chatgpt-image-latest", + "id": "anthropic--claude-4.7-opus", + "name": "anthropic--claude-4.7-opus", + "display_name": "anthropic--claude-4.7-opus", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "anthropic--claude-4-opus", + "name": "anthropic--claude-4-opus", + "display_name": "anthropic--claude-4-opus", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -108254,6 +115943,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -108263,20 +115959,29 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" - }, + } + ] + }, + "scaleway": { + "id": "scaleway", + "name": "Scaleway", + "display_name": "Scaleway", + "api": "https://api.scaleway.ai/v1", + "doc": "https://www.scaleway.com/en/docs/generative-apis/", + "models": [ { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "pixtral-12b-2409", + "name": "Pixtral 12B 2409", + "display_name": "Pixtral 12B 2409", "modalities": { "input": [ "text", @@ -108287,50 +115992,32 @@ ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "open_weights": true, + "release_date": "2024-09-25", + "last_updated": "2026-03-17", "cost": { - "input": 15, - "output": 120 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral Small 3.2 24B Instruct (2506)", + "display_name": "Mistral Small 3.2 24B Instruct (2506)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -108338,85 +116025,58 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-20", + "last_updated": "2026-03-17", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2024-07-25", + "last_updated": "2026-03-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "display_name": "Gemma-3-27B-IT", "modalities": { "input": [ "text", @@ -108427,111 +116087,119 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 40000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2026-03-17", "cost": { - "input": 1.25, - "output": 10 + "input": 0.25, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-image-1.5", - "name": "gpt-image-1.5", - "display_name": "gpt-image-1.5", + "id": "bge-multilingual-gemma2", + "name": "BGE Multilingual Gemma2", + "display_name": "BGE Multilingual Gemma2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 8191, + "output": 3072 }, "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-25", - "last_updated": "2025-11-25", - "type": "imageGeneration" + "release_date": "2024-07-26", + "last_updated": "2025-06-15", + "cost": { + "input": 0.1, + "output": 0 + }, + "type": "chat" }, { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 256000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", - "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", + "cost": { + "input": 0.6, + "output": 3.6 + }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ "text", - "image", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 32000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -108539,123 +116207,130 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2026-03-17", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "qwen3-embedding-8b", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 32768, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-25-11", + "last_updated": "2026-03-17", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2026-03-17", + "cost": { + "input": 0.003, + "output": 0 + }, + "type": "chat" + }, + { + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8196 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2026-03-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 260000, "output": 16384 }, "temperature": true, @@ -108664,63 +116339,51 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2026-03-17", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.75, + "output": 2.25 }, "type": "chat" }, { - "id": "gpt-image-2", - "name": "gpt-image-2", - "display_name": "gpt-image-2", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2026-03-17", "cost": { - "input": 5, - "output": 30, - "cache_read": 1.25 + "input": 0.2, + "output": 0.8 }, - "type": "imageGeneration" - } - ] - }, - "requesty": { - "id": "requesty", - "name": "Requesty", - "display_name": "Requesty", - "api": "https://router.requesty.ai/v1", - "doc": "https://requesty.ai/solution/llm-routing/models", - "models": [ + "type": "chat" + }, { - "id": "xai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -108730,50 +116393,45 @@ ] }, "limit": { - "context": 2000000, - "output": 64000 + "context": 100000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2026-03-17", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05, - "cache_write": 0.2 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -108781,126 +116439,104 @@ } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-09", - "last_updated": "2025-09-09", + "open_weights": true, + "release_date": "2024-01-01", + "last_updated": "2026-03-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 3 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-Max", - "display_name": "GPT-5.1-Codex-Max", + "id": "devstral-2-123b-instruct-2512", + "name": "Devstral 2 123B Instruct (2512)", + "display_name": "Devstral 2 123B Instruct (2512)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-07", + "last_updated": "2026-03-17", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2026-03-17", "cost": { - "input": 1.25, - "output": 10 + "input": 0.2, + "output": 0.2 }, "type": "chat" - }, + } + ] + }, + "opencode": { + "id": "opencode", + "name": "OpenCode Zen", + "display_name": "OpenCode Zen", + "api": "https://opencode.ai/zen/v1", + "doc": "https://opencode.ai/docs/zen", + "models": [ { - "id": "openai/gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -108909,52 +116545,45 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 21, - "output": 168 + "input": 0.3, + "output": 1.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -108963,53 +116592,45 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 0.6, + "output": 3, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -109018,40 +116639,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.2, + "output": 1.2, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3-Codex", - "display_name": "GPT-5.3-Codex", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -109063,10 +116675,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -109074,87 +116686,84 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "kimi-k2.5-free", + "name": "Kimi K2.5 Free", + "display_name": "Kimi K2.5 Free", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -109162,34 +116771,48 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4 Mini", - "display_name": "o4 Mini", + "id": "gemini-3-pro", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -109201,32 +116824,51 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -109240,19 +116882,20 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high", @@ -109270,8 +116913,8 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { "input": 1.75, "output": 14, @@ -109280,13 +116923,59 @@ "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "display_name": "GPT-5.1-Codex-Mini", + "id": "glm-5-free", + "name": "GLM-5 Free", + "display_name": "GLM-5 Free", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -109294,9 +116983,9 @@ }, "limit": { "context": 400000, - "output": 100000 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -109312,7 +117001,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -109325,20 +117015,59 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "openai/gpt-5-image", - "name": "GPT-5 Image", - "display_name": "GPT-5 Image", + "id": "minimax-m2.1-free", + "name": "MiniMax M2.1 Free", + "display_name": "MiniMax M2.1 Free", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ "text", @@ -109346,36 +117075,40 @@ "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-10-14", - "last_updated": "2025-10-14", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 5, - "output": 10, - "cache_read": 1.25 + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ "text", @@ -109389,7 +117122,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -109422,16 +117155,16 @@ "release_date": "2025-11-13", "last_updated": "2025-11-13", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -109443,10 +117176,10 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -109455,51 +117188,55 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 30, - "output": 180, - "cache_read": 30 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "mimo-v2-flash-free", + "name": "MiMo V2 Flash Free", + "display_name": "MiMo V2 Flash Free", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -109510,55 +117247,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gpt-5.3-codex-spark", + "name": "GPT-5.3 Codex Spark", + "display_name": "GPT-5.3 Codex Spark", "modalities": { "input": [ - "text", - "audio", - "image", - "video" + "text" ], "output": [ - "text", - "audio", - "image" + "text" ] }, "limit": { - "context": 400000, + "context": 128000, "output": 128000 }, "temperature": false, @@ -109574,10 +117296,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -109588,56 +117310,99 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "trinity-large-preview-free", + "name": "Trinity Large Preview", + "display_name": "Trinity Large Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "deepseek-v4-flash-free", + "name": "DeepSeek V4 Flash Free", + "display_name": "DeepSeek V4 Flash Free", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ "text", @@ -109651,20 +117416,20 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -109681,34 +117446,30 @@ "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -109719,46 +117480,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 1 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "mimo-v2-pro-free", + "name": "MiMo V2 Pro Free", + "display_name": "MiMo V2 Pro Free", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -109766,7 +117514,7 @@ }, "limit": { "context": 1048576, - "output": 65536 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -109777,52 +117525,41 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "cache_write": 4.5 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -109832,87 +117569,62 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.55 + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "ling-2.6-flash-free", + "name": "Ling 2.6 Flash Free", + "display_name": "Ling 2.6 Flash Free", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 62000 + "context": 262100, + "output": 32800 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-01", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", + "id": "claude-sonnet-4-6", "name": "Claude Sonnet 4.6", "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -109920,7 +117632,7 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -109963,90 +117675,72 @@ "input": 3, "output": 15, "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "cache_write": 3.75 }, "type": "chat" }, { - "id": "anthropic/claude-3-7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "glm-4.7-free", + "name": "GLM-4.7 Free", + "display_name": "GLM-4.7 Free", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "qwen3.6-plus-free", + "name": "Qwen3.6 Plus Free", + "display_name": "Qwen3.6 Plus Free", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -110056,39 +117750,42 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -110096,196 +117793,166 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 0.45, + "output": 1.8 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false + "context": 262144, + "output": 65536 }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -110304,8 +117971,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -110318,25 +117984,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -110348,7 +118009,7 @@ }, "limit": { "context": 400000, - "output": 272000 + "output": 128000 }, "temperature": false, "tool_call": true, @@ -110360,8 +118021,14 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "fixed", - "effort": "high", + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -110373,68 +118040,31 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 15, - "output": 120 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" - }, - { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video", - "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -110445,44 +118075,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31, - "cache_write": 2.375, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", @@ -110494,49 +118110,63 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "hy3-preview-free", + "name": "Hy3 preview Free", + "display_name": "Hy3 preview Free", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 256000, "output": 64000 }, "temperature": true, @@ -110545,23 +118175,22 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -110574,49 +118203,61 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" - } - ] - }, - "digitalocean": { - "id": "digitalocean", - "name": "DigitalOcean", - "display_name": "DigitalOcean", - "api": "https://inference.do-ai.run/v1", - "doc": "https://docs.digitalocean.com/products/gradient-ai-platform/details/models/", - "models": [ + }, { - "id": "openai-gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "gemini-3-flash", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -110624,30 +118265,50 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "multi-qa-mpnet-base-dot-v1", - "name": "Multi-QA-mpnet-base-dot-v1", - "display_name": "Multi-QA-mpnet-base-dot-v1", + "id": "minimax-m2.5-free", + "name": "MiniMax M2.5 Free", + "display_name": "MiniMax M2.5 Free", "modalities": { "input": [ "text" @@ -110657,107 +118318,148 @@ ] }, "limit": { - "context": 512, - "output": 768 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2021-08-30", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.009, - "output": 0 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-04-16", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.5, - "output": 2.7 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "nemotron-3-nano-omni", - "name": "Nemotron Nano 3 Omni", - "display_name": "Nemotron Nano 3 Omni", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", "image", - "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-28", - "last_updated": "2026-04-30", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.5, - "output": 0.9 + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, { - "id": "llama3-8b-instruct", - "name": "Llama 3.1 Instruct (8B)", - "display_name": "Llama 3.1 Instruct (8B)", + "id": "big-pickle", + "name": "Big Pickle", + "display_name": "Big Pickle", "modalities": { "input": [ "text" @@ -110767,88 +118469,41 @@ ] }, "limit": { - "context": 131072, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.198, - "output": 0.198 - }, - "type": "chat" - }, - { - "id": "anthropic-claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, + "context": 200000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], "interleaved": true, "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2025-10-17", + "last_updated": "2025-10-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic-claude-sonnet-4", + "id": "claude-sonnet-4", "name": "Claude Sonnet 4", "display_name": "Claude Sonnet 4", "modalities": { @@ -110881,50 +118536,87 @@ "output": 15, "cache_read": 0.3, "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], "context_over_200k": { "input": 6, "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 + "cache_read": 0.6, + "cache_write": 7.5 } }, "type": "chat" }, { - "id": "wan2-2-t2v-a14b", - "name": "Wan2.2-T2V-A14B", - "display_name": "Wan2.2-T2V-A14B", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 100, - "output": 1 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2026-04-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 0 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, "type": "chat" }, { - "id": "qwen-2.5-14b-instruct", - "name": "Qwen 2.5 14B Instruct", - "display_name": "Qwen 2.5 14B Instruct", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -110934,8 +118626,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -110944,15 +118636,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 + }, "type": "chat" }, { - "id": "openai-gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "claude-3-5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ "text", @@ -110964,44 +118661,46 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen 3.5 397B A17B", - "display_name": "Qwen 3.5 397B A17B", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -111010,43 +118709,53 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-04-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.55, - "output": 3.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai-o3", - "name": "o3", - "display_name": "o3", + "id": "grok-code", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -111054,55 +118763,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" - }, - { - "id": "e5-large-v2", - "name": "E5 Large v2", - "display_name": "E5 Large v2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 512, - "output": 1024 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2023-05-19", - "last_updated": "2026-04-30", + "release_date": "2025-08-20", + "last_updated": "2025-08-20", "cost": { - "input": 0.02, - "output": 0 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai-gpt-5.2-pro", - "name": "GPT-5.2 pro", - "display_name": "GPT-5.2 pro", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -111118,21 +118797,43 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 21, - "output": 168 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "ring-2.6-1t-free", + "name": "Ring 2.6 1T Free", + "display_name": "Ring 2.6 1T Free", "modalities": { "input": [ "text" @@ -111142,9 +118843,10 @@ ] }, "limit": { - "context": 202752, - "output": 128000 + "context": 262000, + "output": 66000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -111163,53 +118865,64 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-04-16", + "knowledge": "2025-06", + "release_date": "2026-05-08", + "last_updated": "2026-05-08", "cost": { - "input": 1, - "output": 3.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai-gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "nemotron-3-super-free", + "name": "Nemotron 3 Super Free", + "display_name": "Nemotron 3 Super Free", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 204800, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "mistral-7b-instruct-v0.3", - "name": "Mistral 7B Instruct v0.3", - "display_name": "Mistral 7B Instruct v0.3", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -111219,24 +118932,42 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-05-22", - "last_updated": "2024-05-22", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 + }, "type": "chat" }, { - "id": "llama3.3-70b-instruct", - "name": "Llama 3.3 Instruct 70B", - "display_name": "Llama 3.3 Instruct 70B", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -111246,71 +118977,126 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.65, - "output": 0.65 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "mistral-3-14B", - "name": "Ministral 3 14B Instruct", - "display_name": "Ministral 3 14B Instruct", + "id": "gemini-3.1-pro", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-15", - "last_updated": "2026-04-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.2, - "output": 0.2 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -111320,34 +119106,45 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-01-30", - "last_updated": "2025-01-30", + "knowledge": "2024-10", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.99, - "output": 0.99 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "alibaba-qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "mimo-v2-omni-free", + "name": "MiMo V2 Omni Free", + "display_name": "MiMo V2 Omni Free", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 40960 + "context": 262144, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -111355,18 +119152,31 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-04-30", - "last_updated": "2026-04-16", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.25, - "output": 0.55 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "anthropic-claude-opus-4.5", + "id": "claude-opus-4-5", "name": "Claude Opus 4.5", "display_name": "Claude Opus 4.5", "modalities": { @@ -111389,6 +119199,11 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, "knowledge": "2025-03-31", @@ -111403,22 +119218,21 @@ "type": "chat" }, { - "id": "openai-o1", - "name": "o1", - "display_name": "o1", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -111426,169 +119240,316 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, "type": "chat" }, { - "id": "anthropic-claude-3-opus", - "name": "Claude 3 Opus", - "display_name": "Claude 3 Opus", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-08", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "stable-diffusion-3.5-large", - "name": "Stable Diffusion 3.5 Large", - "display_name": "Stable Diffusion 3.5 Large", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 256, - "output": 1 + "context": 1050000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-10-22", - "last_updated": "2026-04-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.08, - "output": 0 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "openai-gpt-5-nano", - "name": "GPT-5 nano", - "display_name": "GPT-5 nano", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" - }, + } + ] + }, + "mixlayer": { + "id": "mixlayer", + "name": "Mixlayer", + "display_name": "Mixlayer", + "api": "https://models.mixlayer.ai/v1", + "doc": "https://docs.mixlayer.com", + "models": [ { - "id": "llama-4-maverick", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B A10B", + "display_name": "Qwen3.5 122B A10B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2026-04-30", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.25, - "output": 0.87 + "input": 0.4, + "output": 3.2 }, "type": "chat" }, { - "id": "anthropic-claude-4.5-sonnet", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -111596,29 +119557,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.6, + "output": 3.6 + }, "type": "chat" }, { - "id": "qwen3-embedding-0.6b", - "name": "Qwen3 Embedding 0.6B", - "display_name": "Qwen3 Embedding 0.6B", + "id": "qwen/qwen3.5-9b", + "name": "Qwen3.5 9B", + "display_name": "Qwen3.5 9B", "modalities": { "input": [ "text" @@ -111628,40 +119591,51 @@ ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-06-03", - "last_updated": "2026-04-16", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.04, - "output": 0 + "input": 0.1, + "output": 0.4 }, - "type": "embedding" + "type": "chat" }, { - "id": "anthropic-claude-4.5-haiku", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5 35B A3B", + "display_name": "Qwen3.5 35B A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -111669,23 +119643,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1, - "output": 5, - "cache_read": 1, - "cache_write": 1.25 + "input": 0.25, + "output": 1.3 }, "type": "chat" }, { - "id": "gte-large-en-v1.5", - "name": "GTE Large (v1.5)", - "display_name": "GTE Large (v1.5)", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ "text" @@ -111695,97 +119677,162 @@ ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-03-27", - "last_updated": "2026-04-16", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.09, - "output": 0 + "input": 0.3, + "output": 2.4 }, "type": "chat" - }, + } + ] + }, + "perplexity-agent": { + "id": "perplexity-agent", + "name": "Perplexity Agent", + "display_name": "Perplexity Agent", + "api": "https://api.perplexity.ai/v1", + "doc": "https://docs.perplexity.ai/docs/agent-api/models", + "models": [ { - "id": "openai-gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic-claude-3.5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-11-05", - "last_updated": "2024-11-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai-gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", @@ -111796,44 +119843,68 @@ ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "deepseek-3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -111842,69 +119913,106 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-02", - "last_updated": "2026-04-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.5, - "output": 1.6 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "nemotron-3-nano-30b", - "name": "Nemotron 3 Nano 30B A3B", - "display_name": "Nemotron 3 Nano 30B A3B", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "anthropic-claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super 120B", + "display_name": "Nemotron 3 Super 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 32000 }, "temperature": true, @@ -111913,34 +120021,34 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.25, + "output": 2.5 }, "type": "chat" }, { - "id": "openai-gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -111948,56 +120056,73 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-08-05", - "last_updated": "2026-04-16", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.05, - "output": 0.45 + "input": 1, + "output": 5, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2026-04-30", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.45, - "output": 1.7 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "openai-o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -112005,118 +120130,191 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "openai-gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", "last_updated": "2026-04-16", "cost": { - "input": 0.1, - "output": 0.7 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "gemma-4-31B-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-30", + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.18, - "output": 0.5 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "nemotron-nano-12b-v2-vl", - "name": "Nemotron Nano 12B v2 VL", - "display_name": "Nemotron Nano 12B v2 VL", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -112124,25 +120322,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-12-01", - "last_updated": "2026-04-30", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.2, - "output": 0.6 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "anthropic-claude-4.1-opus", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -112150,8 +120356,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -112159,37 +120365,74 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -112198,61 +120441,131 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, + "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.95, - "output": 4 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "openai-gpt-image-2", - "name": "GPT Image 2", - "display_name": "GPT Image 2", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "tiers": [ + { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 0.5, + "output": 3, + "cache_read": 0.05 + } + }, "type": "chat" }, { - "id": "anthropic-claude-4.6-sonnet", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -112260,8 +120573,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -112269,112 +120582,131 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 - } + "input": 0.3, + "output": 2.5, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "openai-gpt-5-mini", - "name": "GPT-5 mini", - "display_name": "GPT-5 mini", + "id": "perplexity/sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { "input": 0.25, - "output": 2, - "cache_read": 0.025 + "output": 2.5, + "cache_read": 0.0625 }, "type": "chat" }, { - "id": "anthropic-claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "xai/grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 1, - "output": 5, - "cache_read": 1, - "cache_write": 1.25 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" - }, + } + ] + }, + "alibaba-coding-plan": { + "id": "alibaba-coding-plan", + "name": "Alibaba Coding Plan", + "display_name": "Alibaba Coding Plan", + "api": "https://coding-intl.dashscope.aliyuncs.com/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/coding-plan", + "models": [ { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -112393,60 +120725,36 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.74, - "output": 3.48 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "ministral-3-8b-instruct-2512", - "name": "Ministral 3 8B", - "display_name": "Ministral 3 8B", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", - "type": "chat" - }, - { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", - "modalities": { - "input": [ - "text" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -112456,62 +120764,70 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2026-02-12", - "last_updated": "2026-04-16", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai-gpt-image-1", - "name": "GPT Image 1", - "display_name": "GPT Image 1", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 5, - "output": 40, - "cache_read": 1.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai-gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" @@ -112519,35 +120835,42 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-30", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "nvidia-nemotron-3-super-120b", - "name": "Nemotron-3-Super-120B", - "display_name": "Nemotron-3-Super-120B", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -112557,8 +120880,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 196608, + "output": 24576 }, "temperature": true, "tool_call": true, @@ -112566,55 +120889,78 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-04-16", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.3, - "output": 0.65 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai-gpt-5.4-pro", - "name": "GPT-5.4 pro", - "display_name": "GPT-5.4 pro", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-04", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 30, - "output": 180 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "all-mini-lm-l6-v2", - "name": "All-MiniLM-L6-v2", - "display_name": "All-MiniLM-L6-v2", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -112624,28 +120970,43 @@ ] }, "limit": { - "context": 256, - "output": 384 + "context": 202752, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2021-08-30", - "last_updated": "2026-04-16", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.009, - "output": 0 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "bge-m3", - "name": "BGE M3", - "display_name": "BGE M3", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -112655,237 +121016,222 @@ ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 202752, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-01-30", - "last_updated": "2026-04-30", + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.02, - "output": 0 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "openai-gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "meganova": { + "id": "meganova", + "name": "Meganova", + "display_name": "Meganova", + "api": "https://api.meganova.ai/v1", + "doc": "https://docs.meganova.ai", + "models": [ { - "id": "anthropic-claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 163840, + "output": 64000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 0.5, - "cache_write": 6.25 - } + "input": 0.5, + "output": 2.15 }, "type": "chat" }, { - "id": "openai-gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "openai-gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 163840 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.25, + "output": 0.88 }, "type": "chat" }, { - "id": "openai-gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 164000, + "output": 164000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-10", + "last_updated": "2025-10-10", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.27, + "output": 0.4 }, "type": "chat" }, { - "id": "arcee-trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -112895,30 +121241,33 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-16", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.25, - "output": 0.9, - "cache_read": 0.06 + "input": 0.26, + "output": 0.38 }, "type": "chat" }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral Nemo Instruct", - "display_name": "Mistral Nemo Instruct", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -112928,56 +121277,86 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.6, + "output": 2.6 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-03-24", + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0.45, + "output": 2.8 + }, "type": "chat" }, { - "id": "bge-reranker-v2-m3", - "name": "BGE Reranker v2 M3", - "display_name": "BGE Reranker v2 M3", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -112987,180 +121366,159 @@ ] }, "limit": { - "context": 8192, - "output": 1 + "context": 202752, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-03-12", - "last_updated": "2026-04-30", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.01, - "output": 0 + "input": 0.2, + "output": 0.8 }, - "type": "rerank" + "type": "chat" }, { - "id": "anthropic-claude-3.7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.8, + "output": 2.56 }, "type": "chat" }, { - "id": "qwen3-tts-voicedesign", - "name": "Qwen3 TTS VoiceDesign", - "display_name": "Qwen3 TTS VoiceDesign", + "id": "zai-org/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" ], "output": [ - "audio" - ] - }, - "limit": { - "context": 32768, - "output": 1 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-30", - "type": "chat" - }, - { - "id": "openai-gpt-image-1.5", - "name": "GPT Image 1.5", - "display_name": "GPT Image 1.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 202752, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 5, - "output": 10, - "cache_read": 1 + "input": 0.45, + "output": 1.9 }, "type": "chat" }, { - "id": "openai-gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "anthropic-claude-3.5-sonnet", - "name": "Claude 3.5 Sonnet", - "display_name": "Claude 3.5 Sonnet", + "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24B Instruct", + "display_name": "Mistral Small 3.2 24B Instruct", "modalities": { "input": [ "text", @@ -113171,7 +121529,7 @@ ] }, "limit": { - "context": 200000, + "context": 32768, "output": 8192 }, "temperature": true, @@ -113180,176 +121538,217 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-06-20", - "last_updated": "2024-10-22", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "fal-ai/fast-sdxl", - "name": "Fast SDXL", - "display_name": "Fast SDXL", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-07-26", - "last_updated": "2026-04-16", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.1, + "output": 0.3 + }, "type": "chat" }, { - "id": "fal-ai/flux/schnell", - "name": "FLUX.1 [schnell]", - "display_name": "FLUX.1 [schnell]", + "id": "XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2026-04-16", + "knowledge": "2024-12-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "cost": { + "input": 0.1, + "output": 0.3 + }, "type": "chat" }, { - "id": "fal-ai/elevenlabs/tts/multilingual-v2", - "name": "ElevenLabs Multilingual TTS v2", - "display_name": "ElevenLabs Multilingual TTS v2", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 196608, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2023-08-22", - "last_updated": "2026-04-16", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.28, + "output": 1.2 + }, "type": "chat" }, { - "id": "fal-ai/stable-audio-25/text-to-audio", - "name": "Stable Audio 2.5 (Text-to-Audio)", - "display_name": "Stable Audio 2.5 (Text-to-Audio)", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-08", - "last_updated": "2026-04-16", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.3, + "output": 1.2 + }, "type": "chat" - } - ] - }, - "vultr": { - "id": "vultr", - "name": "Vultr", - "display_name": "Vultr", - "api": "https://api.vultrinference.com/v1", - "doc": "https://api.vultrinference.com/", - "models": [ + }, { - "id": "MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "Qwen/Qwen3.5-Plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 194000, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2025-02-11", - "last_updated": "2025-02-11", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-02", + "last_updated": "2026-02", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.4, + "output": 2.4, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "GLM-5-FP8", - "name": "GLM 5 FP8", - "display_name": "GLM 5 FP8", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -113359,8 +121758,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -113369,56 +121768,59 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.85, - "output": 3.1 + "input": 0.09, + "output": 0.6 }, "type": "chat" }, { - "id": "DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.55, - "output": 1.65 + "input": 0.2, + "output": 0.6 }, "type": "chat" - }, + } + ] + }, + "synthetic": { + "id": "synthetic", + "name": "Synthetic", + "display_name": "Synthetic", + "api": "https://api.synthetic.new/openai/v1", + "doc": "https://synthetic.new/pricing", + "models": [ { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "hf:deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -113428,34 +121830,41 @@ ] }, "limit": { - "context": 129000, - "output": 4096 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "Kimi-K2.5", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "hf:deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 (0528)", + "display_name": "DeepSeek R1 (0528)", "modalities": { "input": [ "text" @@ -113465,13 +121874,14 @@ ] }, "limit": { - "context": 254000, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -113485,29 +121895,19 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.55, - "output": 2.75 + "input": 3, + "output": 8 }, "type": "chat" - } - ] - }, - "alibaba-coding-plan-cn": { - "id": "alibaba-coding-plan-cn", - "name": "Alibaba Coding Plan (China)", - "display_name": "Alibaba Coding Plan (China)", - "api": "https://coding.dashscope.aliyuncs.com/v1", - "doc": "https://help.aliyun.com/zh/model-studio/coding-plan", - "models": [ + }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "hf:deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -113517,43 +121917,40 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2025-09-22", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "hf:deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -113561,34 +121958,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + "open_weights": false, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "hf:deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 (0324)", + "display_name": "DeepSeek V3 (0324)", "modalities": { "input": [ "text" @@ -113598,43 +121981,28 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "hf:deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -113644,8 +122012,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 162816, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -113655,31 +122023,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.27, + "output": 0.4, + "cache_read": 0.27, "cache_write": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "hf:deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -113689,8 +122051,8 @@ ] }, "limit": { - "context": 196608, - "output": 24576 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -113698,46 +122060,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "hf:moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -113757,25 +122105,24 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "hf:moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -113783,12 +122130,13 @@ }, "limit": { "context": 262144, - "output": 32768 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -113802,22 +122150,20 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "hf:moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -113828,7 +122174,7 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -113837,32 +122183,30 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "hf:Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -113882,64 +122226,20 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" - } - ] - }, - "mistral": { - "id": "mistral", - "name": "Mistral", - "display_name": "Mistral", - "doc": "https://docs.mistral.ai/getting-started/models/", - "models": [ - { - "id": "mistral-small-latest", - "name": "Mistral Small (latest)", - "display_name": "Mistral Small (latest)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.65, + "output": 3 }, "type": "chat" }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "hf:Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen 3 235B Instruct", + "display_name": "Qwen 3 235B Instruct", "modalities": { "input": [ "text" @@ -113949,8 +122249,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -113959,19 +122259,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "hf:Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-97B-A17B", + "display_name": "Qwen3.5-97B-A17B", "modalities": { "input": [ "text", @@ -113983,61 +122283,72 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.6, + "output": 3, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "labs-devstral-small-2512", - "name": "Devstral Small 2", - "display_name": "Devstral Small 2", + "id": "hf:Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2024-10", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "cost": { - "input": 0, - "output": 0 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ "text" @@ -114047,8 +122358,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -114057,19 +122368,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.4, + "input": 2, "output": 2 }, "type": "chat" }, { - "id": "magistral-medium-latest", - "name": "Magistral Medium (latest)", - "display_name": "Magistral Medium (latest)", + "id": "hf:openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -114080,7 +122391,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -114088,21 +122399,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2, - "output": 5 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "open-mixtral-8x7b", - "name": "Mixtral 8x7B", - "display_name": "Mixtral 8x7B", + "id": "hf:zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -114112,62 +122427,85 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-01", - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "pixtral-large-latest", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "hf:zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "release_date": "2026-01-18", + "last_updated": "2026-01-18", "cost": { - "input": 2, - "output": 6 + "input": 0.06, + "output": 0.4, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral Large 2.1", - "display_name": "Mistral Large 2.1", + "id": "hf:zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -114177,29 +122515,41 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "release_date": "2026-02-12", + "last_updated": "2026-04-08", "cost": { - "input": 2, - "output": 6 + "input": 1, + "output": 3, + "cache_read": 1 }, "type": "chat" }, { - "id": "codestral-latest", - "name": "Codestral (latest)", - "display_name": "Codestral (latest)", + "id": "hf:zai-org/GLM-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -114209,95 +122559,124 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "release_date": "2026-03-27", + "last_updated": "2026-04-12", "cost": { - "input": 0.3, - "output": 0.9 + "input": 1, + "output": 3, + "cache_read": 1 }, "type": "chat" }, { - "id": "mistral-large-latest", - "name": "Mistral Large (latest)", - "display_name": "Mistral Large (latest)", + "id": "hf:zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "mistral-small-2506", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "hf:nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-NVFP4", + "name": "Nemotron 3 Super 120B", + "display_name": "Nemotron 3 Super 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "knowledge": "2024-04", + "release_date": "2026-03-11", + "last_updated": "2026-04-03", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.3, + "output": 1, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "pixtral-12b", - "name": "Pixtral 12B", - "display_name": "Pixtral 12B", + "id": "hf:nvidia/Kimi-K2.5-NVFP4", + "name": "Kimi K2.5 (NVFP4)", + "display_name": "Kimi K2.5 (NVFP4)", "modalities": { "input": [ "text", @@ -114308,29 +122687,41 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "ministral-8b-latest", - "name": "Ministral 8B (latest)", - "display_name": "Ministral 8B (latest)", + "id": "hf:MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -114340,29 +122731,40 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "mistral-embed", - "name": "Mistral Embed", - "display_name": "Mistral Embed", + "id": "hf:MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -114372,28 +122774,41 @@ ] }, "limit": { - "context": 8000, - "output": 3072 + "context": 191488, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "open_weights": true, + "release_date": "2026-02-07", + "last_updated": "2026-02-07", "cost": { - "input": 0.1, - "output": 0 + "input": 0.6, + "output": 3, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "magistral-small", - "name": "Magistral Small", - "display_name": "Magistral Small", + "id": "hf:MiniMaxAI/MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -114403,8 +122818,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 196608, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -114412,33 +122827,36 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "mistral-small-2603", - "name": "Mistral Small 4", - "display_name": "Mistral Small 4", + "id": "hf:meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -114446,53 +122864,54 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "ministral-3b-latest", - "name": "Ministral 3B (latest)", - "display_name": "Ministral 3B (latest)", + "id": "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama-4-Scout-17B-16E-Instruct", + "display_name": "Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 328000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "open-mixtral-8x22b", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "hf:meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama-3.1-70B-Instruct", + "display_name": "Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -114502,41 +122921,41 @@ ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2, - "output": 6 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "mistral-medium-2604", - "name": "Mistral Medium 3.5", - "display_name": "Mistral Medium 3.5", + "id": "hf:meta-llama/Llama-3.1-405B-Instruct", + "name": "Llama-3.1-405B-Instruct", + "display_name": "Llama-3.1-405B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -114544,20 +122963,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.5, - "output": 7.5 + "input": 3, + "output": 3 }, "type": "chat" }, { - "id": "devstral-small-2505", - "name": "Devstral Small 2505", - "display_name": "Devstral Small 2505", + "id": "hf:meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -114568,95 +122988,120 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "devstral-medium-2507", - "name": "Devstral Medium", - "display_name": "Devstral Medium", + "id": "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 524000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.4, - "output": 2 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "open-mistral-7b", - "name": "Mistral 7B", - "display_name": "Mistral 7B", + "id": "hf:moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2023-09-27", - "last_updated": "2023-09-27", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.25, - "output": 0.25 + "input": 0.95, + "output": 4, + "cache_read": 0.95 }, "type": "chat" - }, + } + ] + }, + "azure": { + "id": "azure", + "name": "Azure", + "display_name": "Azure", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "devstral-medium-latest", - "name": "Devstral 2 (latest)", - "display_name": "Devstral 2 (latest)", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -114669,56 +123114,77 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2025-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 0.4, - "output": 2 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.4, - "output": 2 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "devstral-small-2507", - "name": "Devstral Small", - "display_name": "Devstral Small", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -114728,104 +123194,92 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.13, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "mistral-medium-2508", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.4, - "output": 2 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "mistral-medium-latest", - "name": "Mistral Medium (latest)", - "display_name": "Mistral Medium (latest)", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.125, + "output": 0.5 }, "type": "chat" - } - ] - }, - "ovhcloud": { - "id": "ovhcloud", - "name": "OVHcloud AI Endpoints", - "display_name": "OVHcloud AI Endpoints", - "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", - "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", - "models": [ + }, { - "id": "meta-llama-3_3-70b-instruct", - "name": "Meta-Llama-3_3-70B-Instruct", - "display_name": "Meta-Llama-3_3-70B-Instruct", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ "text" @@ -114835,59 +123289,64 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.74, - "output": 0.74 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "mistral-7b-instruct-v0.3", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.08, + "output": 0.32, + "input_audio": 4 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -114897,40 +123356,29 @@ ] }, "limit": { - "context": 32768, + "context": 128000, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.09, - "output": 0.25 + "input": 5.33, + "output": 16 }, "type": "chat" }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ "text", @@ -114941,59 +123389,86 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1.01, - "output": 1.01 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen3-Coder-30B-A3B-Instruct", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.07, - "output": 0.26 + "input": 1.75, + "output": 14, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ "text" @@ -115003,82 +123478,78 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.05, - "output": 0.18 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral-Small-3.2-24B-Instruct-2506", - "display_name": "Mistral-Small-3.2-24B-Instruct-2506", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.1, - "output": 0.31 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "qwen3.5-9b", - "name": "Qwen3.5-9B", - "display_name": "Qwen3.5-9B", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -115091,56 +123562,54 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.1, - "output": 0.15 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.09, - "output": 0.47 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral-Nemo-Instruct-2407", - "display_name": "Mistral-Nemo-Instruct-2407", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ "text" @@ -115150,28 +123619,45 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.14, - "output": 0.14 + "input": 16.5, + "output": 66, + "cache_read": 8.25 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -115181,79 +123667,95 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-11", + "open_weights": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.1, + "output": 0 }, - "type": "chat" - } - ] - }, - "friendli": { - "id": "friendli", - "name": "Friendli", - "display_name": "Friendli", - "api": "https://api.friendli.ai/serverless/v1", - "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", - "models": [ + "type": "embedding" + }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2026-01-29", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -115263,30 +123765,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -115296,8 +123792,8 @@ ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -115318,19 +123814,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.5 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -115350,18 +123846,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2025-12-23", + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.6, - "output": 0.6 + "input": 1.14, + "output": 4.56 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ "text" @@ -115371,28 +123868,28 @@ ] }, "limit": { - "context": 131072, - "output": 8000 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2025-12-23", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { "input": 0.1, - "output": 0.1 + "output": 0 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "display_name": "DeepSeek-V3.2-Speciale", "modalities": { "input": [ "text" @@ -115402,50 +123899,30 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.58, + "output": 1.68 }, "type": "chat" - } - ] - }, - "cortecs": { - "id": "cortecs", - "name": "Cortecs", - "display_name": "Cortecs", - "api": "https://api.cortecs.ai/v1", - "doc": "https://api.cortecs.ai/v1/models", - "models": [ - { - "id": "minimax-m2.7", - "name": "MiniMax-m2.7", - "display_name": "MiniMax-m2.7", + }, + { + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ "text" @@ -115455,80 +123932,61 @@ ] }, "limit": { - "context": 202752, - "output": 196072 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.47, - "output": 1.4 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.09, - "output": 5.43 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -115538,8 +123996,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -115547,67 +124005,59 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.062, - "output": 0.408 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 0.55, - "output": 2.76 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ "text" @@ -115617,29 +124067,29 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.551, - "output": 1.654 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -115649,41 +124099,29 @@ ] }, "limit": { - "context": 198000, - "output": 198000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.45, - "output": 2.23 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "claude-opus4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -115695,32 +124133,37 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 5.6, - "output": 27.99, - "cache_read": 0.56, - "cache_write": 6.99 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -115730,73 +124173,61 @@ ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.08, - "output": 3.44 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "nova-pro-v1", - "name": "Nova Pro 1.0", - "display_name": "Nova Pro 1.0", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 5000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1.016, - "output": 4.061 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "devstral-2512", - "name": "Devstral 2 2512", - "display_name": "Devstral 2 2512", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -115806,72 +124237,85 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", "cost": { - "input": 0, - "output": 0 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.099, - "output": 0.33 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "codestral-2508", - "name": "Codestral 2508", - "display_name": "Codestral 2508", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ "text" @@ -115881,45 +124325,47 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.03 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "claude-4-5-sonnet", - "name": "Claude 4.5 Sonnet", - "display_name": "Claude 4.5 Sonnet", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ "text", "image", - "pdf" + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -115927,19 +124373,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 3.259, - "output": 16.296 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -115949,29 +124396,60 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-07-11", - "last_updated": "2025-09-05", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.551, - "output": 2.646 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super 120B A12B", - "display_name": "Nemotron 3 Super 120B A12B", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-19", + "last_updated": "2025-11-18", + "cost": { + "input": 0.14, + "output": 0 + }, + "type": "chat" + }, + { + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -115981,30 +124459,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.266, - "output": 0.799 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ "text" @@ -116014,129 +124491,91 @@ ] }, "limit": { - "context": 400000, - "output": 400000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.39, - "output": 1.57 + "input": 0.16, + "output": 0.64 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-17", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 1.654, - "output": 11.024 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "claude-opus4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 8191, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 5.98, - "output": 29.89 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "devstral-small-2512", - "name": "Devstral Small 2 2512", - "display_name": "Devstral Small 2 2512", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", @@ -116147,83 +124586,75 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 0.78 }, "type": "chat" }, { - "id": "minimax-m2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196000, - "output": 196000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.34, - "output": 1.34 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -116233,30 +124664,26 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-14", - "last_updated": "2026-04-14", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.31, - "output": 4.1, - "cache_read": 0.24 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -116266,123 +124693,134 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.67, - "output": 2.46 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "claude-opus4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 5.98, - "output": 29.89 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", "image", - "pdf" + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 3.307, - "output": 16.536 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 272000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -116391,29 +124829,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.164, - "output": 1.311 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ "text" @@ -116423,42 +124872,41 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.22, - "output": 1.34 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -116479,67 +124927,66 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", "cost": { - "input": 0.81, - "output": 3.54, - "cache_read": 0.2 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next 80B", - "display_name": "Qwen3 Coder Next 80B", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.158, - "output": 0.84 + "input": 2.04, + "output": 2.04 }, "type": "chat" }, { - "id": "claude-4-6-sonnet", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -116547,51 +124994,69 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 3.59, - "output": 17.92 + "input": 1.5, + "output": 6, + "cache_read": 0.375 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.441, - "output": 1.984 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "mixtral-8x7B-instruct-v0.1", - "name": "Mixtral 8x7B Instruct v0.1", - "display_name": "Mixtral 8x7B Instruct v0.1", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ "text" @@ -116601,30 +125066,28 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 512, + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.438, - "output": 0.68 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "hermes-4-70b", - "name": "Hermes 4 70B", - "display_name": "Hermes 4 70B", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ "text" @@ -116634,30 +125097,29 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 0.116, - "output": 0.358 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -116667,8 +125129,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -116676,31 +125138,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.32, - "output": 1.18 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ "text" @@ -116710,8 +125162,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -116719,29 +125171,25 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.266, - "output": 0.444 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "intellect-3", - "name": "INTELLECT 3", - "display_name": "INTELLECT 3", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -116754,24 +125202,23 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-26", - "last_updated": "2025-11-26", + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.219, - "output": 1.202 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ "text" @@ -116781,41 +125228,29 @@ ] }, "limit": { - "context": 203000, - "output": 203000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.09, - "output": 0.53 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT Oss 120b", - "display_name": "GPT Oss 120b", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" @@ -116825,34 +125260,29 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-01", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.61 }, "type": "chat" }, { - "id": "qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -116862,8 +125292,8 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -116872,96 +125302,84 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.062, - "output": 0.231 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.585, - "output": 2.307 + "input": 0.37, + "output": 0.37 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT 4.1", - "display_name": "GPT 4.1", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 2.354, - "output": 9.417 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -116971,86 +125389,102 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.656, - "output": 2.731 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "llama-3.1-405b-instruct", - "name": "Llama 3.1 405B Instruct", - "display_name": "Llama 3.1 405B Instruct", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen3.5-122b-a10b", - "name": "Qwen3.5 122B A10B", - "display_name": "Qwen3.5 122B A10B", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -117059,29 +125493,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.444, - "output": 3.106 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ "text" @@ -117091,30 +125536,29 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.089, - "output": 0.275 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3 2512", - "display_name": "Mistral Large 3 2512", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ "text", @@ -117125,30 +125569,31 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0.05 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -117158,54 +125603,43 @@ ] }, "limit": { - "context": 250000, - "output": 250000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.3, + "output": 0.61 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -117214,43 +125648,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.133, - "output": 0.266, - "cache_read": 0.028 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -117259,72 +125704,75 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 1.553, - "output": 3.106, - "cache_read": 0.145 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.053, - "output": 0.222 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" - } - ] - }, - "siliconflow-com": { - "id": "siliconflow-com", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.com/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ + }, { - "id": "nex-agi/DeepSeek-V3.1-Nex-N1", - "name": "nex-agi/DeepSeek-V3.1-Nex-N1", - "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "id": "grok-4-20-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ "text" @@ -117334,8 +125782,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -117343,96 +125791,107 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", - "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "knowledge": "2025-09", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.59, - "output": 0.59 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Thinking", - "name": "Qwen/Qwen3-VL-32B-Thinking", - "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.2, - "output": 1.5 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -117442,44 +125901,32 @@ ] }, "limit": { - "context": 262000, - "output": 131000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.09, - "output": 0.3 + "input": 0.71, + "output": 0.71 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "id": "grok-4-20-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -117487,39 +125934,33 @@ }, "limit": { "context": 262000, - "output": 262000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-09", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.45, - "output": 3.5 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text" @@ -117529,59 +125970,77 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 128000, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.05, - "output": 0.05 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 128000, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-11-11", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "id": "gpt-5.3-chat", + "name": "GPT-5.3 Chat", + "display_name": "GPT-5.3 Chat", "modalities": { "input": [ "text", @@ -117592,28 +126051,31 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.29, - "output": 1 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -117623,8 +126085,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -117632,116 +126094,114 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-06", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.15, - "output": 0.58 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen/Qwen3-235B-A22B", - "display_name": "Qwen/Qwen3-235B-A22B", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "interleaved": true } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.35, - "output": 1.42 + "input": 0.95, + "output": 4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.4 + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Thinking", - "name": "Qwen/Qwen3-VL-8B-Thinking", - "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -117751,29 +126211,26 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.18, - "output": 2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -117784,101 +126241,144 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.05, - "output": 0.05 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.14, - "output": 1.4 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.06, - "output": 0.06 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" @@ -117888,8 +126388,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -117897,136 +126397,178 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.09, - "output": 0.3 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.09, - "output": 0.6 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.14, - "output": 0.57 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.07, - "output": 0.28 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -118035,122 +126577,161 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.07, - "output": 0.28 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + }, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-19", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.18, - "output": 0.18 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -118160,85 +126741,87 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.13, + "input": 0.15, "output": 0.6 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", "image", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", @@ -118249,41 +126832,67 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.27, - "output": 0.27 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -118292,28 +126901,56 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-11-25", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.14, - "output": 0.57 + "input": 5, + "output": 30, + "cache_read": 0.5, + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + }, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", @@ -118324,59 +126961,98 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.3, - "output": 1.5 + "input": 30, + "output": 180, + "context_over_200k": { + "input": 60, + "output": 270 + }, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ] }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-14B-Instruct", - "name": "Qwen/Qwen2.5-14B-Instruct", - "display_name": "Qwen/Qwen2.5-14B-Instruct", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 0.1, - "output": 0.1 + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", @@ -118387,10 +127063,10 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -118399,60 +127075,81 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.29, - "output": 1 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Instruct", - "name": "Qwen/Qwen3-VL-32B-Instruct", - "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.2, - "output": 0.6 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Instruct", - "name": "Qwen/Qwen3-VL-8B-Instruct", - "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -118463,28 +127160,54 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.18, - "output": 0.68 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" - }, + } + ] + }, + "minimax-coding-plan": { + "id": "minimax-coding-plan", + "name": "MiniMax Token Plan (minimax.io)", + "display_name": "MiniMax Token Plan (minimax.io)", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/token-plan/intro", + "models": [ { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -118494,59 +127217,34 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", - "cost": { - "input": 0.25, - "output": 1 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 33000, - "output": 4000 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "stepfun-ai/Step-3.5-Flash", - "name": "stepfun-ai/Step-3.5-Flash", - "display_name": "stepfun-ai/Step-3.5-Flash", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -118556,8 +127254,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -118565,20 +127263,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5", - "name": "zai-org/GLM-4.5", - "display_name": "zai-org/GLM-4.5", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -118588,39 +127299,46 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.4, - "output": 2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-5V-Turbo", - "name": "zai-org/GLM-5V-Turbo", - "display_name": "zai-org/GLM-5V-Turbo", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 204800, "output": 131072 }, "temperature": true, @@ -118640,21 +127358,22 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.2, - "output": 4, + "input": 0, + "output": 0, + "cache_read": 0, "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "zai-org/GLM-4.7", - "display_name": "zai-org/GLM-4.7", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" @@ -118664,8 +127383,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -118675,29 +127394,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "zai-org/GLM-5.1", - "display_name": "zai-org/GLM-5.1", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -118707,8 +127422,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -118718,30 +127433,32 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 1.4, - "output": 4.4, - "cache_write": 0 + "input": 0, + "output": 0 }, "type": "chat" - }, - { - "id": "zai-org/GLM-4.5-Air", - "name": "zai-org/GLM-4.5-Air", - "display_name": "zai-org/GLM-4.5-Air", + } + ] + }, + "upstage": { + "id": "upstage", + "name": "Upstage", + "display_name": "Upstage", + "api": "https://api.upstage.ai/v1/solar", + "doc": "https://developers.upstage.ai/docs/apis/chat", + "models": [ + { + "id": "solar-pro2", + "name": "solar-pro2", + "display_name": "solar-pro2", "modalities": { "input": [ "text" @@ -118751,28 +127468,30 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2025-03", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.14, - "output": 0.86 + "input": 0.25, + "output": 0.25 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "zai-org/GLM-5", - "display_name": "zai-org/GLM-5", + "id": "solar-mini", + "name": "solar-mini", + "display_name": "solar-mini", "modalities": { "input": [ "text" @@ -118782,52 +127501,40 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-06-12", + "last_updated": "2025-04-22", "cost": { - "input": 1, - "output": 3.2 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "zai-org/GLM-4.6V", - "display_name": "zai-org/GLM-4.6V", + "id": "solar-pro3", + "name": "solar-pro3", + "display_name": "solar-pro3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -118835,20 +127542,29 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-07", - "last_updated": "2025-12-07", + "knowledge": "2025-03", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.25, + "output": 0.25 }, "type": "chat" - }, + } + ] + }, + "amazon-bedrock": { + "id": "amazon-bedrock", + "name": "Amazon Bedrock", + "display_name": "Amazon Bedrock", + "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", + "models": [ { - "id": "zai-org/GLM-4.6", - "name": "zai-org/GLM-4.6", - "display_name": "zai-org/GLM-4.6", + "id": "zai.glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -118858,65 +127574,78 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.5, - "output": 1.9 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5V", - "name": "zai-org/GLM-4.5V", - "display_name": "zai-org/GLM-4.5V", + "id": "global.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (Global)", + "display_name": "Claude Sonnet 4.5 (Global)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.14, - "output": 0.86 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "id": "qwen.qwen3-235b-a22b-2507-v1:0", + "name": "Qwen3 235B A22B 2507", + "display_name": "Qwen3 235B A22B 2507", "modalities": { "input": [ "text" @@ -118926,8 +127655,8 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -118935,19 +127664,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-23", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.06, - "output": 0.06 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", + "id": "zai.glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -118957,8 +127687,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 202752, + "output": 101376 }, "temperature": true, "tool_call": true, @@ -118968,54 +127698,64 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.14, - "output": 0.57 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "amazon.nova-pro-v1:0", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", + "id": "openai.gpt-oss-20b-1:0", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -119025,8 +127765,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -119035,49 +127775,55 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.07, + "output": 0.3 }, "type": "chat" }, { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", + "id": "us.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (US)", + "display_name": "Claude Haiku 4.5 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.14, - "output": 0.57 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "writer.palmyra-x4-v1:0", + "name": "Palmyra X4", + "display_name": "Palmyra X4", "modalities": { "input": [ "text" @@ -119087,28 +127833,29 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 122880, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "deepseek-ai/DeepSeek-V3.1", - "display_name": "deepseek-ai/DeepSeek-V3.1", + "id": "moonshot.kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -119118,8 +127865,8 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -119127,42 +127874,47 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.27, - "output": 1 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "mistral.ministral-3-8b-instruct", + "name": "Ministral 3 8B", + "display_name": "Ministral 3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 4000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { "input": 0.15, "output": 0.15 @@ -119170,51 +127922,55 @@ "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "deepseek-ai/DeepSeek-V3", - "display_name": "deepseek-ai/DeepSeek-V3", + "id": "meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct", + "display_name": "Llama 4 Scout 17B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 3500000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.25, - "output": 1 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "us.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (US)", + "display_name": "Claude Opus 4.5 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -119222,20 +127978,23 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.18, - "output": 0.18 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "deepseek-ai/DeepSeek-R1", - "display_name": "deepseek-ai/DeepSeek-R1", + "id": "qwen.qwen3-coder-480b-a35b-v1:0", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -119245,72 +128004,62 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.5, - "output": 2.18 + "input": 0.22, + "output": 1.8 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "google.gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "display_name": "Google Gemma 3 27B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 202752, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.12, + "output": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", + "id": "mistral.ministral-3-14b-instruct", + "name": "Ministral 14B 3.0", + "display_name": "Ministral 14B 3.0", "modalities": { "input": [ "text" @@ -119320,40 +128069,41 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-10", - "last_updated": "2025-11-25", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.27, - "output": 0.41 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "deepseek-ai/DeepSeek-V3.2", - "display_name": "deepseek-ai/DeepSeek-V3.2", + "id": "us.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (US)", + "display_name": "Claude Sonnet 4.5 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -119361,25 +128111,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.27, - "output": 0.42 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "qwen.qwen3-coder-30b-a3b-v1:0", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -119389,65 +128137,90 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.27, - "output": 1 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "openai/gpt-oss-20b", - "display_name": "openai/gpt-oss-20b", + "id": "anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.04, - "output": 0.18 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "openai/gpt-oss-120b", - "display_name": "openai/gpt-oss-120b", + "id": "zai.glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -119457,8 +128230,8 @@ ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -119466,67 +128239,67 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.05, - "output": 0.45 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "google.gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2025-11-25", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.049999999999999996, + "output": 0.09999999999999999 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (Global)", + "display_name": "Claude Opus 4.5 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -119534,51 +128307,118 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.086, - "output": 0.086 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "au.anthropic.claude-sonnet-4-6", + "name": "AU Anthropic Claude Sonnet 4.6", + "display_name": "AU Anthropic Claude Sonnet 4.6", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "cost": { + "input": 3.3, + "output": 16.5, + "cache_read": 0.33, + "cache_write": 4.125 + }, + "type": "chat" + }, + { + "id": "qwen.qwen3-vl-235b-a22b", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", + "release_date": "2025-10-04", "last_updated": "2025-11-25", "cost": { - "input": 0.086, - "output": 0.086 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "meta.llama3-3-70b-instruct-v1:0", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -119588,8 +128428,8 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -119597,19 +128437,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", + "id": "nvidia.nemotron-nano-9b-v2", + "name": "NVIDIA Nemotron Nano 9B v2", + "display_name": "NVIDIA Nemotron Nano 9B v2", "modalities": { "input": [ "text" @@ -119619,72 +128460,89 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.06, + "output": 0.23 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "moonshotai/Kimi-K2-Thinking", - "display_name": "moonshotai/Kimi-K2-Thinking", + "id": "us.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (US)", + "display_name": "Claude Opus 4.7 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.55, - "output": 2.5 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "moonshotai/Kimi-K2.6", - "display_name": "moonshotai/Kimi-K2.6", + "id": "nvidia.nemotron-nano-12b-v2", + "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "display_name": "NVIDIA Nemotron Nano 12B v2 VL BF16", "modalities": { "input": [ "text", @@ -119695,72 +128553,65 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "moonshotai/Kimi-K2-Instruct", - "display_name": "moonshotai/Kimi-K2-Instruct", + "id": "anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-13", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.58, - "output": 2.29 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "moonshotai/Kimi-K2-Instruct-0905", - "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "id": "deepseek.v3-v1:0", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -119770,28 +128621,30 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 163840, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.4, - "output": 2 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "moonshotai/Kimi-K2.5", - "display_name": "moonshotai/Kimi-K2.5", + "id": "meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct", + "display_name": "Llama 4 Maverick 17B Instruct", "modalities": { "input": [ "text", @@ -119802,76 +128655,90 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.45, - "output": 2.25 + "input": 0.24, + "output": 0.97 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMaxAI/MiniMax-M2.5", - "display_name": "MiniMaxAI/MiniMax-M2.5", + "id": "eu.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (EU)", + "display_name": "Claude Opus 4.7 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.3, - "output": 1.2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMaxAI/MiniMax-M2.1", - "display_name": "MiniMaxAI/MiniMax-M2.1", + "id": "qwen.qwen3-32b-v1:0", + "name": "Qwen3 32B (dense)", + "display_name": "Qwen3 32B (dense)", "modalities": { "input": [ "text" @@ -119881,77 +128748,65 @@ ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "reasoning": { + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "amazon.nova-lite-v1:0", + "name": "Nova Lite", + "display_name": "Nova Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.21, - "output": 0.57 + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 }, "type": "chat" - } - ] - }, - "vercel": { - "id": "vercel", - "name": "Vercel AI Gateway", - "display_name": "Vercel AI Gateway", - "doc": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway", - "models": [ + }, { - "id": "alibaba/qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "mistral.devstral-2-123b", + "name": "Devstral 2 123B", + "display_name": "Devstral 2 123B", "modalities": { "input": [ "text" @@ -119961,8 +128816,8 @@ ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -119971,19 +128826,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 1, - "output": 5 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-27b", - "name": "Qwen 3.6 27B", - "display_name": "Qwen 3.6 27B", + "id": "eu.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (EU)", + "display_name": "Claude Opus 4.5 (EU)", "modalities": { "input": [ "text", @@ -119995,8 +128849,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -120004,31 +128858,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-05-01", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.6, - "output": 3.5999999999999996 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "alibaba/qwen3-embedding-8b", - "name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "openai.gpt-oss-120b-1:0", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -120038,28 +128884,28 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.05, - "output": 0 + "input": 0.15, + "output": 0.6 }, - "type": "embedding" + "type": "chat" }, { - "id": "alibaba/qwen-3-30b", - "name": "Qwen3-30B-A3B", - "display_name": "Qwen3-30B-A3B", + "id": "deepseek.r1-v1:0", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -120069,8 +128915,8 @@ ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -120080,30 +128926,31 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.08, - "output": 0.29 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "alibaba/qwen-3-235b", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "mistral.mistral-large-3-675b-instruct", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -120111,33 +128958,31 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "alibaba/qwen3.5-flash", - "name": "Qwen 3.5 Flash", - "display_name": "Qwen 3.5 Flash", + "id": "mistral.magistral-small-2509", + "name": "Magistral Small 1.2", + "display_name": "Magistral Small 1.2", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 40000 }, "temperature": true, "tool_call": true, @@ -120145,82 +128990,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.001, - "cache_write": 0.125 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "mistral.pixtral-large-2502-v1:0", + "name": "Pixtral Large (25.02)", + "display_name": "Pixtral Large (25.02)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-03", + "release_date": "2025-04-08", + "last_updated": "2025-04-08", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.09999999999999999, - "cache_write": 0.625 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "alibaba/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "mistral.voxtral-mini-3b-2507", + "name": "Voxtral Mini 3B 2507", + "display_name": "Voxtral Mini 3B 2507", "modalities": { "input": [ + "audio", "text" ], "output": [ @@ -120228,40 +129046,28 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 1.2, - "output": 6 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "alibaba/qwen3-embedding-0.6b", - "name": "Qwen3 Embedding 0.6B", - "display_name": "Qwen3 Embedding 0.6B", + "id": "writer.palmyra-x5-v1:0", + "name": "Palmyra X5", + "display_name": "Palmyra X5", "modalities": { "input": [ "text" @@ -120271,28 +129077,29 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1040000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.01, - "output": 0 + "input": 0.6, + "output": 6 }, - "type": "embedding" + "type": "chat" }, { - "id": "alibaba/qwen-3-32b", - "name": "Qwen 3.32B", - "display_name": "Qwen 3.32B", + "id": "minimax.minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ "text" @@ -120302,8 +129109,8 @@ ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -120312,158 +129119,190 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "alibaba/qwen-3.6-max-preview", - "name": "Qwen 3.6 Max Preview", - "display_name": "Qwen 3.6 Max Preview", + "id": "qwen.qwen3-next-80b-a3b", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 240000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-24", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.26, - "cache_write": 1.625 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "alibaba/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "au.anthropic.claude-opus-4-6-v1", + "name": "AU Anthropic Claude Opus 4.6", + "display_name": "AU Anthropic Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 16.5, + "output": 82.5, + "cache_read": 1.65, + "cache_write": 20.625 + }, + "type": "chat" + }, + { + "id": "meta.llama3-1-8b-instruct-v1:0", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, - "output": 1.5 + "input": 0.22, + "output": 0.22 }, "type": "chat" }, { - "id": "alibaba/qwen3-vl-thinking", - "name": "Qwen3 VL Thinking", - "display_name": "Qwen3 VL Thinking", + "id": "amazon.nova-2-lite-v1:0", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "attachment": false, + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.7, - "output": 8.4 + "input": 0.33, + "output": 2.75 }, "type": "chat" }, { - "id": "alibaba/qwen3-235b-a22b-thinking", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "moonshotai.kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262114, - "output": 262114 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -120474,29 +129313,23 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "interleaved": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 0.3, - "output": 2.9 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "alibaba/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "nvidia.nemotron-super-3-120b", + "name": "NVIDIA Nemotron 3 Super 120B A12B", + "display_name": "NVIDIA Nemotron 3 Super 120B A12B", "modalities": { "input": [ "text" @@ -120507,26 +129340,26 @@ }, "limit": { "context": 262144, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0.09, - "output": 1.1 + "input": 0.15, + "output": 0.65 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder-next", + "id": "qwen.qwen3-coder-next", "name": "Qwen3 Coder Next", "display_name": "Qwen3 Coder Next", "modalities": { @@ -120538,8 +129371,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -120548,61 +129381,64 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-22", - "last_updated": "2026-02-19", + "open_weights": true, + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 0.5, - "output": 1.2 + "input": 0.22, + "output": 1.8 }, "type": "chat" }, { - "id": "alibaba/qwen3-embedding-4b", - "name": "Qwen3 Embedding 4B", - "display_name": "Qwen3 Embedding 4B", + "id": "mistral.ministral-3-3b-instruct", + "name": "Ministral 3 3B", + "display_name": "Ministral 3 3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.02, - "output": 0 + "input": 0.1, + "output": 0.1 }, - "type": "embedding" + "type": "chat" }, { - "id": "alibaba/qwen3-max-thinking", - "name": "Qwen 3 Max Thinking", - "display_name": "Qwen 3 Max Thinking", + "id": "eu.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (EU)", + "display_name": "Claude Haiku 4.5 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -120610,65 +129446,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01", - "last_updated": "2025-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "alibaba/qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "minimax.minimax-m2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 204608, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-24", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "meta.llama3-1-70b-instruct-v1:0", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ "text" @@ -120678,8 +129504,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -120687,20 +129513,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.38, - "output": 1.53 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "alibaba/qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "openai.gpt-oss-safeguard-120b", + "name": "GPT OSS Safeguard 120B", + "display_name": "GPT OSS Safeguard 120B", "modalities": { "input": [ "text" @@ -120710,41 +129536,28 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "alibaba/qwen3.5-plus", - "name": "Qwen 3.5 Plus", - "display_name": "Qwen 3.5 Plus", + "id": "global.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (Global)", + "display_name": "Claude Haiku 4.5 (Global)", "modalities": { "input": [ "text", @@ -120756,7 +129569,7 @@ ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 64000 }, "temperature": true, @@ -120765,33 +129578,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-02-16", - "last_updated": "2026-02-19", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04, - "cache_write": 0.5 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "alibaba/qwen-3-14b", - "name": "Qwen3-14B", - "display_name": "Qwen3-14B", + "id": "amazon.nova-micro-v1:0", + "name": "Nova Micro", + "display_name": "Nova Micro", "modalities": { "input": [ "text" @@ -120801,74 +129604,80 @@ ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.06, - "output": 0.24 + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 }, "type": "chat" }, { - "id": "alibaba/qwen3-vl-instruct", - "name": "Qwen3 VL Instruct", - "display_name": "Qwen3 VL Instruct", + "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.7, - "output": 2.8 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder-30b-a3b", - "name": "Qwen 3 Coder 30B A3B Instruct", - "display_name": "Qwen 3 Coder 30B A3B Instruct", + "id": "eu.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (EU)", + "display_name": "Claude Sonnet 4.5 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -120876,33 +129685,35 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.07, - "output": 0.27 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "perplexity/sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "mistral.voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -120910,159 +129721,181 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 3, - "output": 15 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "perplexity/sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "nvidia.nemotron-nano-3-30b", + "name": "NVIDIA Nemotron Nano 3 30B", + "display_name": "NVIDIA Nemotron Nano 3 30B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1, - "output": 1 + "input": 0.06, + "output": 0.24 }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning", - "name": "Sonar Reasoning", - "display_name": "Sonar Reasoning", + "id": "anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { "input": 1, - "output": 5 + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "google.gemma-3-4b-it", + "name": "Gemma 3 4B IT", + "display_name": "Gemma 3 4B IT", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 2, - "output": 8 + "input": 0.04, + "output": 0.08 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-thinking", - "name": "DeepSeek V3.2 Thinking", - "display_name": "DeepSeek V3.2 Thinking", + "id": "global.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (Global)", + "display_name": "Claude Opus 4.7 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.03 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "minimax.minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -121072,8 +129905,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 196608, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -121082,20 +129915,50 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.3, + "output": 1.2 + }, + "type": "chat" + }, + { + "id": "openai.gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "display_name": "GPT OSS Safeguard 20B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 0.27, - "output": 0.4 + "input": 0.07, + "output": 0.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "deepseek.v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -121106,7 +129969,7 @@ }, "limit": { "context": 163840, - "output": 128000 + "output": 81920 }, "temperature": true, "tool_call": true, @@ -121115,23 +129978,25 @@ "default": true }, "attachment": false, - "open_weights": false, + "open_weights": true, "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 0.3, - "output": 1 + "input": 0.62, + "output": 1.85 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "global.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (Global)", + "display_name": "Claude Opus 4.6 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -121139,43 +130004,62 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-23", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -121183,88 +130067,131 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-23", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "global.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (Global)", + "display_name": "Claude Sonnet 4.6 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163842, - "output": 8000 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.22 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "us.meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct (US)", + "display_name": "Llama 4 Maverick 17B Instruct (US)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, + "context": 1000000, "output": 16384 }, "temperature": true, @@ -121272,54 +130199,21 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", - "cost": { - "input": 0.77, - "output": 0.77 - }, - "type": "chat" - }, - { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.27, - "output": 1 + "input": 0.24, + "output": 0.97 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "us.deepseek.r1-v1:0", + "name": "DeepSeek-R1 (US)", + "display_name": "DeepSeek-R1 (US)", "modalities": { "input": [ "text" @@ -121338,17 +130232,6 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, "knowledge": "2024-07", @@ -121361,52 +130244,59 @@ "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "au.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (AU)", + "display_name": "Claude Sonnet 4.5 (AU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12", - "last_updated": "2025-12", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.05, - "output": 0.15 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "us.anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1 (US)", + "display_name": "Claude Opus 4.1 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262100, - "output": 80000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -121414,342 +130304,614 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-03", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.25, - "output": 0.8999999999999999 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-preview", - "name": "Trinity Large Preview", - "display_name": "Trinity Large Preview", + "id": "anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-01", - "last_updated": "2025-01", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.25, - "output": 1 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "recraft/recraft-v3", - "name": "Recraft V3", - "display_name": "Recraft V3", + "id": "us.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (US)", + "display_name": "Claude Sonnet 4.6 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-10", - "last_updated": "2024-10", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, "type": "chat" }, { - "id": "recraft/recraft-v2", - "name": "Recraft V2", - "display_name": "Recraft V2", + "id": "anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-03", - "last_updated": "2024-03", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "voyage/voyage-3-large", - "name": "voyage-3-large", - "display_name": "voyage-3-large", + "id": "eu.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (EU)", + "display_name": "Claude Sonnet 4.6 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.18, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "voyage/voyage-4-large", - "name": "voyage-4-large", - "display_name": "voyage-4-large", + "id": "eu.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (EU)", + "display_name": "Claude Opus 4.6 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "voyage/voyage-3.5-lite", - "name": "voyage-3.5-lite", - "display_name": "voyage-3.5-lite", + "id": "au.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (AU)", + "display_name": "Claude Haiku 4.5 (AU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.02, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "voyage/voyage-code-3", - "name": "voyage-code-3", - "display_name": "voyage-code-3", + "id": "jp.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (JP)", + "display_name": "Claude Sonnet 4.5 (JP)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.18, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "voyage/voyage-finance-2", - "name": "voyage-finance-2", - "display_name": "voyage-finance-2", + "id": "jp.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (JP)", + "display_name": "Claude Sonnet 4.6 (JP)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-03", - "last_updated": "2024-03", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.12, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "voyage/voyage-4-lite", - "name": "voyage-4-lite", - "display_name": "voyage-4-lite", + "id": "us.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (US)", + "display_name": "Claude Opus 4.6 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "voyage/voyage-4", - "name": "voyage-4", - "display_name": "voyage-4", + "id": "us.meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct (US)", + "display_name": "Llama 4 Scout 17B Instruct (US)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 3500000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.17, + "output": 0.66 + }, "type": "chat" }, { - "id": "voyage/voyage-code-2", - "name": "voyage-code-2", - "display_name": "voyage-code-2", + "id": "jp.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (JP)", + "display_name": "Claude Opus 4.7 (JP)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1000000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.12, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" - }, + } + ] + }, + "vercel": { + "id": "vercel", + "name": "Vercel AI Gateway", + "display_name": "Vercel AI Gateway", + "doc": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway", + "models": [ { - "id": "voyage/voyage-law-2", - "name": "voyage-law-2", - "display_name": "voyage-law-2", + "id": "prime-intellect/intellect-3", + "name": "INTELLECT 3", + "display_name": "INTELLECT 3", "modalities": { "input": [ "text" @@ -121759,28 +130921,30 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-03", - "last_updated": "2024-03", + "knowledge": "2024-10", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 0.12, - "output": 0 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "voyage/voyage-3.5", - "name": "voyage-3.5", - "display_name": "voyage-3.5", + "id": "inception/mercury-edit-2", + "name": "Mercury Edit 2", + "display_name": "Mercury Edit 2", "modalities": { "input": [ "text" @@ -121790,28 +130954,30 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2026-03-30", + "last_updated": "2026-03-30", "cost": { - "input": 0.06, - "output": 0 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "morph/morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "inception/mercury-coder-small", + "name": "Mercury Coder Small Beta", + "display_name": "Mercury Coder Small Beta", "modalities": { "input": [ "text" @@ -121822,27 +130988,27 @@ }, "limit": { "context": 32000, - "output": 32000 + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-02-26", + "last_updated": "2026-05-01", "cost": { - "input": 0.9, - "output": 1.9 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "morph/morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "inception/mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ "text" @@ -121852,28 +131018,30 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2026-02-24", + "last_updated": "2026-03-06", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.25, + "output": 0.75, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "zai/glm-5v-turbo", - "name": "GLM 5V Turbo", - "display_name": "GLM 5V Turbo", + "id": "zai/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text", @@ -121885,8 +131053,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -121894,32 +131062,39 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-03", + "release_date": "2026-04-07", + "last_updated": "2026-04-16", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "zai/glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "zai/glm-5v-turbo", + "name": "GLM 5V Turbo", + "display_name": "GLM 5V Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 120000 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -121927,44 +131102,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-04-01", + "last_updated": "2026-04-03", "cost": { - "input": 0.43, - "output": 1.75, - "cache_read": 0.08 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "zai/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "zai/glm-4.6v-flash", + "name": "GLM-4.6V-Flash", + "display_name": "GLM-4.6V-Flash", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 128000, + "output": 24000 }, "temperature": true, "tool_call": true, @@ -121972,26 +131137,11 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-19", - "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "type": "chat" }, { @@ -122035,22 +131185,20 @@ "type": "chat" }, { - "id": "zai/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "zai/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 128000, + "output": 96000 }, "temperature": true, "tool_call": true, @@ -122058,39 +131206,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-07", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "zai/glm-4.6v-flash", - "name": "GLM-4.6V-Flash", - "display_name": "GLM-4.6V-Flash", + "id": "zai/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 24000 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -122099,16 +131241,57 @@ "default": true }, "attachment": true, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "cost": { + "input": 0.6, + "output": 1.8 + }, + "type": "chat" + }, + { + "id": "zai/glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2026-03-13", + "last_updated": "2026-03-13", + "cost": { + "input": 0.07, + "output": 0.39999999999999997 + }, "type": "chat" }, { - "id": "zai/glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "zai/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -122118,8 +131301,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 96000 }, "temperature": true, "tool_call": true, @@ -122135,19 +131318,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.45, + "output": 1.8 }, "type": "chat" }, { - "id": "zai/glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "zai/glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -122157,8 +131340,8 @@ ] }, "limit": { - "context": 128000, - "output": 96000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -122166,14 +131349,20 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", + "knowledge": "2025-07", "release_date": "2025-07-28", "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 1.1 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, @@ -122216,21 +131405,20 @@ "type": "chat" }, { - "id": "zai/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "zai/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 202752, + "output": 120000 }, "temperature": true, "tool_call": true, @@ -122238,21 +131426,33 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0.43, + "output": 1.75, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "zai/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "zai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -122262,8 +131462,8 @@ ] }, "limit": { - "context": 200000, - "output": 96000 + "context": 202800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -122274,17 +131474,22 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2026-02-12", + "last_updated": "2026-02-19", "cost": { - "input": 0.45, - "output": 1.8 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, @@ -122325,9 +131530,9 @@ "type": "chat" }, { - "id": "zai/glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "cohere/embed-v4.0", + "name": "Embed v4.0", + "display_name": "Embed v4.0", "modalities": { "input": [ "text" @@ -122337,27 +131542,21 @@ ] }, "limit": { - "context": 200000, - "output": 131000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.07, - "output": 0.39999999999999997 + "input": 0.12, + "output": 0 }, "type": "chat" }, @@ -122394,9 +131593,9 @@ "type": "chat" }, { - "id": "cohere/embed-v4.0", - "name": "Embed v4.0", - "display_name": "Embed v4.0", + "id": "voyage/voyage-4-lite", + "name": "voyage-4-lite", + "display_name": "voyage-4-lite", "modalities": { "input": [ "text" @@ -122406,28 +131605,24 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 32000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", - "cost": { - "input": 0.12, - "output": 0 - }, + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "prime-intellect/intellect-3", - "name": "INTELLECT 3", - "display_name": "INTELLECT 3", + "id": "voyage/voyage-4", + "name": "voyage-4", + "display_name": "voyage-4", "modalities": { "input": [ "text" @@ -122437,201 +131632,179 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-11-26", - "last_updated": "2025-11-26", - "cost": { - "input": 0.2, - "output": 1.1 - }, + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "xai/grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "voyage/voyage-3.5", + "name": "voyage-3.5", + "display_name": "voyage-3.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-05-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.19999999999999998 + "input": 0.06, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-4.20-non-reasoning", - "name": "Grok 4.20 Non-Reasoning", - "display_name": "Grok 4.20 Non-Reasoning", + "id": "voyage/voyage-law-2", + "name": "voyage-law-2", + "display_name": "voyage-law-2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", + "release_date": "2024-03", + "last_updated": "2024-03", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-4.20-non-reasoning-beta", - "name": "Grok 4.20 Beta Non-Reasoning", - "display_name": "Grok 4.20 Beta Non-Reasoning", + "id": "voyage/voyage-3.5-lite", + "name": "voyage-3.5-lite", + "display_name": "voyage-3.5-lite", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.02, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-4.20-reasoning", - "name": "Grok 4.20 Reasoning", - "display_name": "Grok 4.20 Reasoning", + "id": "voyage/voyage-3-large", + "name": "voyage-3-large", + "display_name": "voyage-3-large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.18, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-imagine-image", - "name": "Grok Imagine Image", - "display_name": "Grok Imagine Image", + "id": "voyage/voyage-finance-2", + "name": "voyage-finance-2", + "display_name": "voyage-finance-2", "modalities": { "input": [ "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { "context": 8192, - "output": 8192 + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-02-19", + "release_date": "2024-03", + "last_updated": "2024-03", + "cost": { + "input": 0.12, + "output": 0 + }, "type": "chat" }, { - "id": "xai/grok-4.20-multi-agent-beta", - "name": "Grok 4.20 Multi Agent Beta", - "display_name": "Grok 4.20 Multi Agent Beta", + "id": "voyage/voyage-code-2", + "name": "voyage-code-2", + "display_name": "voyage-code-2", "modalities": { "input": [ "text" @@ -122641,41 +131814,38 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-imagine-image-pro", - "name": "Grok Imagine Image Pro", - "display_name": "Grok Imagine Image Pro", + "id": "voyage/voyage-4-large", + "name": "voyage-4-large", + "display_name": "voyage-4-large", "modalities": { "input": [ "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 32000, "output": 8192 }, "temperature": true, @@ -122685,14 +131855,14 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-02-19", + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "xai/grok-4-fast-reasoning", - "name": "Grok 4 Fast Reasoning", - "display_name": "Grok 4 Fast Reasoning", + "id": "voyage/voyage-code-3", + "name": "voyage-code-3", + "display_name": "voyage-code-3", "modalities": { "input": [ "text" @@ -122702,36 +131872,28 @@ ] }, "limit": { - "context": 2000000, - "output": 256000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.18, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-non-reasoning", - "name": "Grok 4.1 Fast Non-Reasoning", - "display_name": "Grok 4.1 Fast Non-Reasoning", + "id": "bytedance/seed-1.6", + "name": "Seed 1.6", + "display_name": "Seed 1.6", "modalities": { "input": [ "text" @@ -122741,43 +131903,43 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.2, - "output": 0.5, + "input": 0.25, + "output": 2, "cache_read": 0.05 }, "type": "chat" }, { - "id": "xai/grok-4.20-reasoning-beta", - "name": "Grok 4.20 Beta Reasoning", - "display_name": "Grok 4.20 Beta Reasoning", + "id": "bytedance/seed-1.8", + "name": "Seed 1.8", + "display_name": "Seed 1.8", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -122785,122 +131947,203 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "knowledge": "2024-10", + "release_date": "2025-10", + "last_updated": "2025-10", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "xai/grok-4.20-multi-agent", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "bfl/flux-pro-1.0-fill", + "name": "FLUX.1 Fill [pro]", + "display_name": "FLUX.1 Fill [pro]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 512, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", - "cost": { - "input": 2, - "output": 6, - "cache_read": 0.19999999999999998 + "release_date": "2024-10", + "last_updated": "2024-10", + "type": "chat" + }, + { + "id": "bfl/flux-kontext-max", + "name": "FLUX.1 Kontext Max", + "display_name": "FLUX.1 Kontext Max", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 512, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2025-06", "type": "chat" }, { - "id": "xai/grok-4.1-fast-reasoning", - "name": "Grok 4.1 Fast Reasoning", - "display_name": "Grok 4.1 Fast Reasoning", + "id": "bfl/flux-pro-1.1", + "name": "FLUX1.1 [pro]", + "display_name": "FLUX1.1 [pro]", "modalities": { "input": [ "text" ], "output": [ + "image" + ] + }, + "limit": { + "context": 512, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-10", + "last_updated": "2024-10", + "type": "chat" + }, + { + "id": "bfl/flux-pro-1.1-ultra", + "name": "FLUX1.1 [pro] Ultra", + "display_name": "FLUX1.1 [pro] Ultra", + "modalities": { + "input": [ "text" + ], + "output": [ + "image" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 512, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "release_date": "2024-11", + "last_updated": "2024-11", + "type": "chat" + }, + { + "id": "bfl/flux-kontext-pro", + "name": "FLUX.1 Kontext Pro", + "display_name": "FLUX.1 Kontext Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 512, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2025-06", "type": "chat" }, { - "id": "xai/grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.6, + "output": 1.2 }, "type": "chat" }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -122911,29 +132154,28 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "moonshotai/kimi-k2-turbo", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ "text" @@ -122943,66 +132185,74 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-08", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 2.4, + "output": 10 }, "type": "chat" }, { - "id": "xai/grok-2-vision", - "name": "Grok 2 Vision", - "display_name": "Grok 2 Vision", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 216144, + "output": 216144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 + "input": 0.47, + "output": 2, + "cache_read": 0.14 }, "type": "chat" }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "moonshotai/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -123012,8 +132262,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262114, + "output": 262114 }, "temperature": true, "tool_call": true, @@ -123023,37 +132273,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true } }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 1.15, + "output": 8, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "xai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -123066,22 +132318,21 @@ "supported": true } }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-20", + "last_updated": "2026-04-24", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "xai/grok-3-fast", - "name": "Grok 3 Fast", - "display_name": "Grok 3 Fast", + "id": "moonshotai/kimi-k2", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -123092,7 +132343,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -123100,21 +132351,53 @@ "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", + "cost": { + "input": 1, + "output": 3 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-medium", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.25 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "xai/grok-3-mini-fast", - "name": "Grok 3 Mini Fast", - "display_name": "Grok 3 Mini Fast", + "id": "mistral/devstral-2", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -123124,32 +132407,56 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-10", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "type": "chat" + }, + { + "id": "mistral/codestral-embed", + "name": "Codestral Embed", + "display_name": "Codestral Embed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 1536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 + "input": 0.15, + "output": 0 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "NVIDIA Nemotron 3 Super 120B A12B", - "display_name": "NVIDIA Nemotron 3 Super 120B A12B", + "id": "mistral/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -123158,29 +132465,63 @@ "text" ] }, + "limit": { + "context": 60288, + "output": 16000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", + "cost": { + "input": 0.04, + "output": 0.17 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-large-3", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { "context": 256000, - "output": 32000 + "output": 256000 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-30", + "knowledge": "2024-10", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.15, - "output": 0.65 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "Nemotron 3 Nano 30B A3B", - "display_name": "Nemotron 3 Nano 30B A3B", + "id": "mistral/devstral-small-2", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", "modalities": { "input": [ "text" @@ -123190,97 +132531,91 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-12", - "last_updated": "2024-12", - "cost": { - "input": 0.06, - "output": 0.24 - }, + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "type": "chat" }, { - "id": "nvidia/nemotron-nano-12b-v2-vl", - "name": "Nvidia Nemotron Nano 12B V2 VL", - "display_name": "Nvidia Nemotron Nano 12B V2 VL", + "id": "mistral/devstral-small", + "name": "Devstral Small 1.1", + "display_name": "Devstral Small 1.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-12", - "last_updated": "2024-12", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "nvidia/nemotron-nano-9b-v2", - "name": "Nvidia Nemotron Nano 9B V2", - "display_name": "Nvidia Nemotron Nano 9B V2", + "id": "mistral/ministral-14b", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.04, - "output": 0.16 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "inception/mercury-edit-2", - "name": "Mercury Edit 2", - "display_name": "Mercury Edit 2", + "id": "mistral/mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", "modalities": { "input": [ "text" @@ -123290,30 +132625,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "inception/mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": "mistral/magistral-medium", + "name": "Magistral Medium (latest)", + "display_name": "Magistral Medium (latest)", "modalities": { "input": [ "text" @@ -123324,7 +132657,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -123333,20 +132666,20 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-06", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.024999999999999998 + "input": 2, + "output": 5 }, "type": "chat" }, { - "id": "inception/mercury-coder-small", - "name": "Mercury Coder Small Beta", - "display_name": "Mercury Coder Small Beta", + "id": "mistral/ministral-3b", + "name": "Ministral 3B (latest)", + "display_name": "Ministral 3B (latest)", "modalities": { "input": [ "text" @@ -123356,8 +132689,8 @@ ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -123365,81 +132698,56 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-26", - "last_updated": "2026-05-01", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0.25, - "output": 1 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT 5.1 Codex Max", - "display_name": "GPT 5.1 Codex Max", + "id": "mistral/pixtral-large", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 128000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "mistral/ministral-8b", + "name": "Ministral 8B (latest)", + "display_name": "Ministral 8B (latest)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -123447,30 +132755,28 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.18 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "GPT 4o Mini Search Preview", - "display_name": "GPT 4o Mini Search Preview", + "id": "mistral/mixtral-8x22b-instruct", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ "text" @@ -123480,42 +132786,40 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 64000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2025-01", - "last_updated": "2025-01", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai/codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "mistral/magistral-small", + "name": "Magistral Small", + "display_name": "Magistral Small", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -123523,64 +132827,57 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.38 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "mistral/codestral", + "name": "Codestral (latest)", + "display_name": "Codestral (latest)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "openai/gpt-5.3-chat", - "name": "GPT-5.3 Chat", - "display_name": "GPT-5.3 Chat", + "id": "mistral/pixtral-12b", + "name": "Pixtral 12B", + "display_name": "Pixtral 12B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -123588,42 +132885,40 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-06", + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT 5.2 ", - "display_name": "GPT 5.2 ", + "id": "mistral/mistral-small", + "name": "Mistral Small (latest)", + "display_name": "Mistral Small (latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -123631,41 +132926,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 21, - "output": 168 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "morph/morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", "modalities": { "input": [ "text" @@ -123675,8 +132950,8 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 16000, + "output": 16000 }, "temperature": false, "tool_call": false, @@ -123685,130 +132960,80 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.13, - "output": 0 + "input": 0.8, + "output": 1.2 }, - "type": "embedding" + "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT 5.5", - "display_name": "GPT 5.5", + "id": "morph/morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.9, + "output": 1.9 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT 5.3 Codex", - "display_name": "GPT 5.3 Codex", + "id": "openai/text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.13, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "openai/text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "openai/gpt-4o-mini-search-preview", + "name": "GPT 4o Mini Search Preview", + "display_name": "GPT 4o Mini Search Preview", "modalities": { "input": [ "text" @@ -123818,23 +133043,24 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "knowledge": "2023-09", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.1, - "output": 0 + "input": 0.15, + "output": 0.6 }, - "type": "embedding" + "type": "chat" }, { "id": "openai/gpt-5.2", @@ -123894,6 +133120,38 @@ }, "type": "chat" }, + { + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo", + "display_name": "GPT-3.5 Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16385, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2021-09", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", + "cost": { + "input": 0.5, + "output": 1.5 + }, + "type": "chat" + }, { "id": "openai/o3-pro", "name": "o3 Pro", @@ -123944,9 +133202,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "GPT 5.4 Mini", - "display_name": "GPT 5.4 Mini", + "id": "openai/gpt-5.4-nano", + "name": "GPT 5.4 Nano", + "display_name": "GPT 5.4 Nano", "modalities": { "input": [ "text", @@ -123994,73 +133252,47 @@ "release_date": "2026-03-17", "last_updated": "2026-03-17", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.19999999999999998, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT 5.4 Nano", - "display_name": "GPT 5.4 Nano", + "id": "openai/text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.19999999999999998, - "output": 1.25, - "cache_read": 0.02 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "openai/gpt-5.5-pro", + "name": "GPT 5.5 Pro", + "display_name": "GPT 5.5 Pro", "modalities": { "input": [ "text", @@ -124072,7 +133304,7 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": true, @@ -124083,34 +133315,16 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12", - "last_updated": "2025-12", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 30, + "output": 180 }, "type": "chat" }, @@ -124172,67 +133386,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.1-thinking", - "name": "GPT 5.1 Thinking", - "display_name": "GPT 5.1 Thinking", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text", - "image" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5.4-pro", - "name": "GPT 5.4 Pro", - "display_name": "GPT 5.4 Pro", + "id": "openai/gpt-5.2-pro", + "name": "GPT 5.2 ", + "display_name": "GPT 5.2 ", "modalities": { "input": [ "text", @@ -124244,7 +133400,7 @@ ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": true, @@ -124275,18 +133431,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-06", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 30, - "output": 180 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5 Turbo", - "display_name": "GPT-3.5 Turbo", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -124296,7 +133453,7 @@ ] }, "limit": { - "context": 16385, + "context": 8192, "output": 4096 }, "temperature": true, @@ -124310,146 +133467,8 @@ "release_date": "2023-03-01", "last_updated": "2023-03-01", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" - }, - { - "id": "openai/o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 100000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", - "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 - }, - "type": "chat" - }, - { - "id": "openai/text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 1536 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "cost": { - "input": 0.02, - "output": 0 - }, - "type": "embedding" - }, - { - "id": "openai/gpt-5.4", - "name": "GPT 5.4", - "display_name": "GPT 5.4", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1050000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-06", - "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 1.5, + "output": 2 }, "type": "chat" }, @@ -124491,57 +133510,6 @@ }, "type": "chat" }, - { - "id": "openai/gpt-5-pro", - "name": "GPT-5 pro", - "display_name": "GPT-5 pro", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text", - "image" - ] - }, - "limit": { - "context": 400000, - "output": 272000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 15, - "output": 120 - }, - "type": "chat" - }, { "id": "openai/gpt-oss-safeguard-20b", "name": "gpt-oss-safeguard-20b", @@ -124572,86 +133540,14 @@ "cost": { "input": 0.08, "output": 0.3, - "cache_read": 0.04 - }, - "type": "chat" - }, - { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.1, - "output": 0.5 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5.5-pro", - "name": "GPT 5.5 Pro", - "display_name": "GPT 5.5 Pro", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 30, - "output": 180 + "cache_read": 0.04 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "openai/text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -124662,28 +133558,27 @@ }, "limit": { "context": 8192, - "output": 4096 + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2021-09", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 1.5, - "output": 2 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "openai/gpt-5.1-instant", - "name": "GPT-5.1 Instant", - "display_name": "GPT-5.1 Instant", + "id": "openai/gpt-5-pro", + "name": "GPT-5 pro", + "display_name": "GPT-5 pro", "modalities": { "input": [ "text", @@ -124696,27 +133591,21 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 272000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], + "default_enabled": true, + "mode": "fixed", + "effort": "high", "verbosity": "medium", "verbosity_options": [ "low", @@ -124732,16 +133621,15 @@ "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "openai/gpt-5.4", + "name": "GPT 5.4", + "display_name": "GPT 5.4", "modalities": { "input": [ "text", @@ -124753,7 +133641,7 @@ ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": true, @@ -124772,7 +133660,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -124785,20 +133674,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-03-05", + "last_updated": "2026-03-06", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "openai/gpt-5.4-mini", + "name": "GPT 5.4 Mini", + "display_name": "GPT 5.4 Mini", "modalities": { "input": [ "text", @@ -124810,30 +133698,52 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "openai/gpt-5.1-thinking", + "name": "GPT 5.1 Thinking", + "display_name": "GPT 5.1 Thinking", "modalities": { "input": [ "text", @@ -124841,41 +133751,8 @@ "pdf" ], "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", - "modalities": { - "input": [ "text", "image" - ], - "output": [ - "text" ] }, "limit": { @@ -124886,16 +133763,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", "high" @@ -124911,20 +133788,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", + "knowledge": "2024-10", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { "input": 1.25, "output": 10, - "cache_read": 0.125 + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1 Instant", + "display_name": "GPT-5.1 Instant", "modalities": { "input": [ "text", @@ -124932,7 +133809,8 @@ "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { @@ -124941,52 +133819,24 @@ }, "temperature": true, "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" - }, - { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 100000 - }, - "temperature": false, - "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -124996,58 +133846,61 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "openai/codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-10", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 1.5, + "output": 6, + "cache_read": 0.38 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT 5.1 Codex Max", + "display_name": "GPT 5.1 Codex Max", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -125057,20 +133910,20 @@ "context": 400000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", "high" @@ -125084,70 +133937,22 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { "input": 1.25, "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 100000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", - "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "openai/gpt-5.5", + "name": "GPT 5.5", + "display_name": "GPT 5.5", "modalities": { "input": [ "text", @@ -125159,10 +133964,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -125175,6 +133980,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -125184,34 +133996,34 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "openai/gpt-5.4-pro", + "name": "GPT 5.4 Pro", + "display_name": "GPT 5.4 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1050000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -125222,8 +134034,14 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -125233,20 +134051,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2026-03-05", + "last_updated": "2026-03-06", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ "text", @@ -125257,91 +134073,24 @@ "text" ] }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", - "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, "limit": { "context": 400000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", "high" @@ -125357,24 +134106,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", + "knowledge": "2024-10", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -125384,7 +134134,7 @@ "context": 400000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -125397,10 +134147,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -125413,66 +134163,37 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2025-12", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "amazon/titan-embed-text-v2", - "name": "Titan Text Embeddings V2", - "display_name": "Titan Text Embeddings V2", + "id": "openai/gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 1536 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-04", - "last_updated": "2024-04", - "cost": { - "input": 0.02, - "output": 0 - }, - "type": "chat" - }, - { - "id": "amazon/nova-2-lite", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", - "modalities": { - "input": [ "text", "image" - ], - "output": [ - "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -125480,88 +134201,111 @@ "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 2.5 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "amazon/nova-pro", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "openai/gpt-5.3-codex", + "name": "GPT 5.3 Codex", + "display_name": "GPT 5.3 Codex", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "amazon/nova-lite", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": "openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 + "input": 1.75, + "output": 14, + "cache_read": 0.18 }, "type": "chat" }, { - "id": "amazon/nova-micro", - "name": "Nova Micro", - "display_name": "Nova Micro", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -125571,62 +134315,35 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", - "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 - }, - "type": "chat" - }, - { - "id": "mistral/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 60288, - "output": 16000 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.04, - "output": 0.17 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "mistral/ministral-14b", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ "text", @@ -125638,64 +134355,50 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" - }, - { - "id": "mistral/codestral-embed", - "name": "Codestral Embed", - "display_name": "Codestral Embed", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 1536 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "cost": { - "input": 0.15, - "output": 0 + "input": 10, + "output": 40, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "mistral/mistral-medium", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "openai/gpt-5.3-chat", + "name": "GPT-5.3 Chat", + "display_name": "GPT-5.3 Chat", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -125703,212 +134406,135 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2026-03-03", + "last_updated": "2026-03-06", "cost": { - "input": 0.4, - "output": 2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "mistral/mistral-embed", - "name": "Mistral Embed", - "display_name": "Mistral Embed", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", - "cost": { - "input": 0.1, - "output": 0 - }, - "type": "chat" - }, - { - "id": "mistral/devstral-2", - "name": "Devstral 2", - "display_name": "Devstral 2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 - }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", - "type": "chat" - }, - { - "id": "mistral/mistral-large-3", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.5, - "output": 1.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "mistral/devstral-small-2", - "name": "Devstral Small 2", - "display_name": "Devstral Small 2", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", - "type": "chat" - }, - { - "id": "mistral/devstral-small", - "name": "Devstral Small 1.1", - "display_name": "Devstral Small 1.1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 64000 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", - "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" - }, - { - "id": "mistral/ministral-8b", - "name": "Ministral 8B (latest)", - "display_name": "Ministral 8B (latest)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "mistral/magistral-medium", - "name": "Magistral Medium (latest)", - "display_name": "Magistral Medium (latest)", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -125918,30 +134544,45 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 2, - "output": 5 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "mistral/mistral-small", - "name": "Mistral Small (latest)", - "display_name": "Mistral Small (latest)", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -125952,63 +134593,101 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "mistral/magistral-small", - "name": "Magistral Small", - "display_name": "Magistral Small", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.5, - "output": 1.5 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "mistral/pixtral-12b", - "name": "Pixtral 12B", - "display_name": "Pixtral 12B", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", @@ -126019,8 +134698,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -126028,52 +134707,71 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "mistral/mixtral-8x22b-instruct", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 2, - "output": 6 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "mistral/pixtral-large", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", @@ -126085,7 +134783,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -126093,23 +134791,25 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 2, - "output": 6 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "mistral/ministral-3b", - "name": "Ministral 3B (latest)", - "display_name": "Ministral 3B (latest)", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -126117,124 +134817,155 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "mistral/codestral", - "name": "Codestral (latest)", - "display_name": "Codestral (latest)", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "meta/llama-3.2-1b", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "meta/llama-3.1-8b", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.03, - "output": 0.05 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "meta/llama-3.2-90b", - "name": "Llama 3.2 90B Vision Instruct", - "display_name": "Llama 3.2 90B Vision Instruct", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", @@ -126245,32 +134976,57 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.72, - "output": 0.72 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "meta/llama-3.2-3b", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -126278,28 +135034,29 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.15, - "output": 0.15 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "meta/llama-3.2-11b", - "name": "Llama 3.2 11B Vision Instruct", - "display_name": "Llama 3.2 11B Vision Instruct", + "id": "amazon/nova-2-lite", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", @@ -126310,29 +135067,30 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 1000000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "meta/llama-3.1-70b", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "amazon/titan-embed-text-v2", + "name": "Titan Text Embeddings V2", + "display_name": "Titan Text Embeddings V2", "modalities": { "input": [ "text" @@ -126342,40 +135100,41 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-04", + "last_updated": "2024-04", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.02, + "output": 0 }, "type": "chat" }, { - "id": "meta/llama-3.3-70b", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "amazon/nova-lite", + "name": "Nova Lite", + "display_name": "Nova Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -126383,24 +135142,24 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0, - "output": 0 + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "meta/llama-4-maverick", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "amazon/nova-micro", + "name": "Nova Micro", + "display_name": "Nova Micro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -126408,40 +135167,42 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0, - "output": 0 + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 }, "type": "chat" }, { - "id": "meta/llama-4-scout", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "amazon/nova-pro", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -126449,91 +135210,78 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0, - "output": 0 + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "vercel/v0-1.5-md", - "name": "v0-1.5-md", - "display_name": "v0-1.5-md", + "id": "recraft/recraft-v2", + "name": "Recraft V2", + "display_name": "Recraft V2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 512, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", - "cost": { - "input": 3, - "output": 15 - }, + "release_date": "2024-03", + "last_updated": "2024-03", "type": "chat" }, { - "id": "vercel/v0-1.0-md", - "name": "v0-1.0-md", - "display_name": "v0-1.0-md", + "id": "recraft/recraft-v3", + "name": "Recraft V3", + "display_name": "Recraft V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 512, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15 - }, + "release_date": "2024-10", + "last_updated": "2024-10", "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "Minimax M2.7", - "display_name": "Minimax M2.7", + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -126541,7 +135289,7 @@ }, "limit": { "context": 204800, - "output": 131000 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -126552,23 +135300,19 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "interleaved": true } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { "input": 0.3, "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "cache_read": 0.03, + "cache_write": 0.38 }, "type": "chat" }, @@ -126660,9 +135404,9 @@ "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "minimax/minimax-m2.1-lightning", + "name": "MiniMax M2.1 Lightning", + "display_name": "MiniMax M2.1 Lightning", "modalities": { "input": [ "text" @@ -126681,12 +135425,6 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } - }, "attachment": false, "open_weights": false, "knowledge": "2024-10", @@ -126694,16 +135432,16 @@ "last_updated": "2025-10-27", "cost": { "input": 0.3, - "output": 1.2, + "output": 2.4, "cache_read": 0.03, "cache_write": 0.38 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1-lightning", - "name": "MiniMax M2.1 Lightning", - "display_name": "MiniMax M2.1 Lightning", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -126714,7 +135452,7 @@ }, "limit": { "context": 204800, - "output": 131072 + "output": 131000 }, "temperature": true, "tool_call": true, @@ -126722,26 +135460,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2026-02-12", + "last_updated": "2026-02-19", "cost": { "input": 0.3, - "output": 2.4, + "output": 1.2, "cache_read": 0.03, - "cache_write": 0.38 + "cache_write": 0.375 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "minimax/minimax-m2.7", + "name": "Minimax M2.7", + "display_name": "Minimax M2.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -126759,17 +135503,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-19", + "attachment": true, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0.3, "output": 1.2, - "cache_read": 0.03, + "cache_read": 0.06, "cache_write": 0.375 }, "type": "chat" @@ -126813,6 +135563,39 @@ }, "type": "chat" }, + { + "id": "kwaipilot/kat-coder-pro-v2", + "name": "Kat Coder Pro V2", + "display_name": "Kat Coder Pro V2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-30", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 + }, + "type": "chat" + }, { "id": "kwaipilot/kat-coder-pro-v1", "name": "KAT-Coder-Pro V1", @@ -126843,9 +135626,43 @@ "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro-v2", - "name": "Kat Coder Pro V2", - "display_name": "Kat Coder Pro V2", + "id": "nvidia/nemotron-nano-12b-v2-vl", + "name": "Nvidia Nemotron Nano 12B V2 VL", + "display_name": "Nvidia Nemotron Nano 12B V2 VL", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12", + "last_updated": "2024-12", + "cost": { + "input": 0.2, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "NVIDIA Nemotron 3 Super 120B A12B", + "display_name": "NVIDIA Nemotron 3 Super 120B A12B", "modalities": { "input": [ "text" @@ -126856,7 +135673,38 @@ }, "limit": { "context": 256000, - "output": 256000 + "output": 32000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-18", + "last_updated": "2026-03-30", + "cost": { + "input": 0.15, + "output": 0.65 + }, + "type": "chat" + }, + { + "id": "nvidia/nemotron-nano-9b-v2", + "name": "Nvidia Nemotron Nano 9B V2", + "display_name": "Nvidia Nemotron Nano 9B V2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -126866,25 +135714,56 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-30", + "knowledge": "2024-10", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.04, + "output": 0.16 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "Nemotron 3 Nano 30B A3B", + "display_name": "Nemotron 3 Nano 30B A3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12", + "last_updated": "2024-12", + "cost": { + "input": 0.06, + "output": 0.24 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -126892,8 +135771,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -126905,37 +135784,169 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", + "mode": "mixed", "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, + "min": 1024, "unit": "tokens" }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02", + "last_updated": "2026-02", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -126947,8 +135958,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -126958,76 +135969,61 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-06", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "google/gemini-3-pro-image", - "name": "Nano Banana Pro (Gemini 3 Pro Image)", - "display_name": "Nano Banana Pro (Gemini 3 Pro Image)", + "id": "anthropic/claude-3.5-sonnet-20240620", + "name": "Claude 3.5 Sonnet (2024-06-20)", + "display_name": "Claude 3.5 Sonnet (2024-06-20)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-09", - "last_updated": "2025-09", + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "cost": { - "input": 2, - "output": 120 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -127040,52 +136036,58 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ "low", - "high" + "medium", + "high", + "xhigh" ], + "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-02-24", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -127093,111 +136095,104 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "google/imagen-4.0-ultra-generate-001", - "name": "Imagen 4 Ultra", - "display_name": "Imagen 4 Ultra", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-24", - "last_updated": "2025-05-24", - "type": "imageGeneration" + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "type": "chat" }, { - "id": "google/gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "anthropic/claude-3-opus", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 200000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.15, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, - "type": "embedding" + "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -127209,8 +136204,8 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -127220,152 +136215,167 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-03", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.14, - "output": 0.39999999999999997 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-image", - "name": "Nano Banana (Gemini 2.5 Flash Image)", - "display_name": "Nano Banana (Gemini 2.5 Flash Image)", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-03-20", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.3, - "output": 2.5 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/text-embedding-005", - "name": "Text Embedding 005", - "display_name": "Text Embedding 005", + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 200000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-08", - "last_updated": "2024-08", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.03, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "google/text-multilingual-embedding-002", - "name": "Text Multilingual Embedding 002", - "display_name": "Text Multilingual Embedding 002", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-03", - "last_updated": "2024-03", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.03, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-image-preview", - "name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", - "display_name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-03-06", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.5, - "output": 3 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ "text", @@ -127377,35 +136387,52 @@ ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-07", - "last_updated": "2026-05-08", + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.03 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "google/gemini-3-flash", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B IT", + "display_name": "Gemma 4 26B A4B IT", "modalities": { "input": [ "text", @@ -127417,8 +136444,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -127426,63 +136453,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-04-02", + "last_updated": "2026-04-03", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 0.13, + "output": 0.39999999999999997 }, "type": "chat" }, { - "id": "google/imagen-4.0-generate-001", - "name": "Imagen 4", - "display_name": "Imagen 4", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 1000000, + "output": 65000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "type": "imageGeneration" + "release_date": "2026-05-07", + "last_updated": "2026-05-08", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.03 + }, + "type": "chat" }, { "id": "google/gemini-2.5-flash-preview-09-2025", @@ -127544,36 +136563,63 @@ "type": "chat" }, { - "id": "google/gemini-embedding-2", - "name": "Gemini Embedding 2", - "display_name": "Gemini Embedding 2", + "id": "google/imagen-4.0-fast-generate-001", + "name": "Imagen 4 Fast", + "display_name": "Imagen 4 Fast", "modalities": { "input": [ "text" ], "output": [ + "image" + ] + }, + "limit": { + "context": 480, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2025-06", + "type": "imageGeneration" + }, + { + "id": "google/imagen-4.0-generate-001", + "name": "Imagen 4", + "display_name": "Imagen 4", + "modalities": { + "input": [ "text" + ], + "output": [ + "image" ] }, "limit": { - "context": 8192, + "context": 480, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-10", - "last_updated": "2026-03-23", - "type": "chat" + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "type": "imageGeneration" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B IT", - "display_name": "Gemma 4 26B A4B IT", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", @@ -127599,42 +136645,54 @@ "release_date": "2026-04-02", "last_updated": "2026-04-03", "cost": { - "input": 0.13, + "input": 0.14, "output": 0.39999999999999997 }, "type": "chat" }, { - "id": "google/imagen-4.0-fast-generate-001", - "name": "Imagen 4 Fast", - "display_name": "Imagen 4 Fast", + "id": "google/gemini-3.1-flash-image-preview", + "name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", + "display_name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ + "text", "image" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2025-06", + "release_date": "2026-02-26", + "last_updated": "2026-03-06", + "cost": { + "input": 0.5, + "output": 3 + }, "type": "imageGeneration" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "google/gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", "modalities": { "input": [ "text", @@ -127679,8 +136737,8 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { "input": 0.1, "output": 0.4, @@ -127689,78 +136747,9 @@ "type": "chat" }, { - "id": "google/gemini-2.5-flash-image-preview", - "name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", - "display_name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text", - "image" - ] - }, - "limit": { - "context": 32768, - "output": 32768 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-03-20", - "cost": { - "input": 0.3, - "output": 2.5 - }, - "type": "imageGeneration" - }, - { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1048576, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" - }, - { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", @@ -127781,19 +136770,18 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "budget", "budget": { "default": -1, - "min": 0, + "min": 512, "max": 24576, "auto": -1, - "off": 0, "unit": "tokens" }, "summaries": true, @@ -127806,26 +136794,25 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", "image", - "audio", "video", + "audio", "pdf" ], "output": [ @@ -127833,8 +136820,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -127846,14 +136833,12 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ @@ -127864,109 +136849,77 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 4, + "output": 18, + "cache_read": 0.4 } }, "type": "chat" }, { - "id": "google/gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "google/gemini-embedding-2", + "name": "Gemini Embedding 2", + "display_name": "Gemini Embedding 2", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, + "release_date": "2026-03-10", + "last_updated": "2026-03-23", "type": "chat" }, { - "id": "moonshotai/kimi-k2-turbo", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "google/gemini-3-pro-image", + "name": "Nano Banana Pro (Gemini 3 Pro Image)", + "display_name": "Nano Banana Pro (Gemini 3 Pro Image)", "modalities": { "input": [ "text" ], "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 2.4, - "output": 10 - }, - "type": "chat" - }, - { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", - "modalities": { - "input": [ "text", - "image", - "video" - ], - "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 65536, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -127974,40 +136927,48 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "attachment": false, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.6, - "output": 1.2 + "input": 2, + "output": 120 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "google/gemini-3-flash", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262114, - "output": 262114 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -128018,36 +136979,50 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2025-03", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "google/gemini-2.5-flash-image-preview", + "name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", + "display_name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -128056,19 +137031,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", "cost": { - "input": 0.6, + "input": 0.3, "output": 2.5 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "google/gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", @@ -128080,8 +137055,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 65000 }, "temperature": true, "tool_call": true, @@ -128095,31 +137070,34 @@ } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2026-03-03", + "last_updated": "2026-03-06", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "cache_write": 1 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 216144, - "output": 216144 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -128130,62 +137108,95 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2026-02-19", + "last_updated": "2026-02-24", "cost": { - "input": 0.47, - "output": 2, - "cache_read": 0.14 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "google/imagen-4.0-ultra-generate-001", + "name": "Imagen 4 Ultra", + "display_name": "Imagen 4 Ultra", "modalities": { "input": [ "text" ], "output": [ + "image" + ] + }, + "limit": { + "context": 480, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-24", + "last_updated": "2025-05-24", + "type": "imageGeneration" + }, + { + "id": "google/gemini-2.5-flash-image", + "name": "Nano Banana (Gemini 2.5 Flash Image)", + "display_name": "Nano Banana (Gemini 2.5 Flash Image)", + "modalities": { + "input": [ "text" + ], + "output": [ + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", "cost": { - "input": 1, - "output": 3 + "input": 0.3, + "output": 2.5 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "interfaze/interfaze-beta", - "name": "Interfaze Beta", - "display_name": "Interfaze Beta", + "id": "google/gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -128195,130 +137206,96 @@ ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 8192, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-07", - "last_updated": "2026-04-29", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 1.5, - "output": 3.5 + "input": 0.15, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "anthropic/claude-3.5-sonnet-20240620", - "name": "Claude 3.5 Sonnet (2024-06-20)", - "display_name": "Claude 3.5 Sonnet (2024-06-20)", + "id": "google/text-multilingual-embedding-002", + "name": "Text Multilingual Embedding 002", + "display_name": "Text Multilingual Embedding 002", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "release_date": "2024-03", + "last_updated": "2024-03", "cost": { - "input": 3, - "output": 15 + "input": 0.03, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "google/text-embedding-005", + "name": "Text Embedding 005", + "display_name": "Text Embedding 005", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02", - "last_updated": "2026-02", + "release_date": "2024-08", + "last_updated": "2024-08", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.03, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "google/gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -128326,59 +137303,36 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -128386,8 +137340,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -128398,30 +137352,46 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 18.75 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -128429,42 +137399,35 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -128472,148 +137435,110 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", + "default_enabled": true, + "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 2.5, + "output": 15, + "cache_read": 0.25 } }, "type": "chat" }, { - "id": "anthropic/claude-3-opus", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - }, - { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "vercel/v0-1.0-md", + "name": "v0-1.0-md", + "display_name": "v0-1.0-md", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "vercel/v0-1.5-md", + "name": "v0-1.5-md", + "display_name": "v0-1.5-md", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 128000, "output": 32000 }, "temperature": true, @@ -128624,70 +137549,62 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.27, + "output": 0.4 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -128695,166 +137612,153 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-23", + "last_updated": "2026-04-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163842, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.27, + "output": 0.4, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "deepseek/deepseek-v3", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 163840, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.77, + "output": 0.77 }, "type": "chat" }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "deepseek/deepseek-v3.2-thinking", + "name": "DeepSeek V3.2 Thinking", + "display_name": "DeepSeek V3.2 Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 128000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] + "interleaved": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.28, + "output": 0.42, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 163840, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -128862,23 +137766,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.3, + "output": 1 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5-pro", - "name": "MiMo V2.5 Pro", - "display_name": "MiMo V2.5 Pro", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -128888,8 +137790,8 @@ ] }, "limit": { - "context": 1050000, - "output": 131000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -128897,35 +137799,43 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-05-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-23", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.19999999999999998 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5", - "name": "MiMo M2.5", - "display_name": "MiMo M2.5", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 131100 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -128933,21 +137843,21 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.39999999999999997, - "output": 2, - "cache_read": 0.08 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-pro", - "name": "MiMo V2 Pro", - "display_name": "MiMo V2 Pro", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -128957,8 +137867,8 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -128966,21 +137876,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-20", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.19999999999999998 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", + "id": "perplexity/sonar-reasoning", + "name": "Sonar Reasoning", + "display_name": "Sonar Reasoning", "modalities": { "input": [ "text" @@ -128990,127 +137911,129 @@ ] }, "limit": { - "context": 262144, - "output": 32000 + "context": 127000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.1, - "output": 0.29 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "bytedance/seed-1.6", - "name": "Seed 1.6", - "display_name": "Seed 1.6", + "id": "perplexity/sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 127000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09", - "last_updated": "2025-09", + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "bytedance/seed-1.8", - "name": "Seed 1.8", - "display_name": "Seed 1.8", + "id": "perplexity/sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 127000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-10", - "last_updated": "2025-10", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "meituan/longcat-flash-chat", - "name": "LongCat Flash Chat", - "display_name": "LongCat Flash Chat", + "id": "perplexity/sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-30", - "last_updated": "2025-08-30", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15 + }, "type": "chat" }, { - "id": "meituan/longcat-flash-thinking", - "name": "LongCat Flash Thinking", - "display_name": "LongCat Flash Thinking", + "id": "arcee-ai/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ "text" @@ -129120,30 +138043,29 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-12", + "last_updated": "2025-12", "cost": { - "input": 0.15, - "output": 1.5 + "input": 0.05, + "output": 0.15 }, "type": "chat" }, { - "id": "meituan/longcat-flash-thinking-2601", - "name": "LongCat Flash Thinking 2601", - "display_name": "LongCat Flash Thinking 2601", + "id": "arcee-ai/trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ "text" @@ -129153,180 +138075,241 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262100, + "output": 80000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-03", + "cost": { + "input": 0.25, + "output": 0.8999999999999999 + }, "type": "chat" }, { - "id": "bfl/flux-pro-1.0-fill", - "name": "FLUX.1 Fill [pro]", - "display_name": "FLUX.1 Fill [pro]", + "id": "arcee-ai/trinity-large-preview", + "name": "Trinity Large Preview", + "display_name": "Trinity Large Preview", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 131000, + "output": 131000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-10", - "last_updated": "2024-10", + "knowledge": "2024-10", + "release_date": "2025-01", + "last_updated": "2025-01", + "cost": { + "input": 0.25, + "output": 1 + }, "type": "chat" }, { - "id": "bfl/flux-pro-1.1", - "name": "FLUX1.1 [pro]", - "display_name": "FLUX1.1 [pro]", + "id": "alibaba/qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 262144, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-10", - "last_updated": "2024-10", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "cost": { + "input": 1.2, + "output": 6, + "cache_read": 0.24 + }, "type": "chat" }, { - "id": "bfl/flux-kontext-pro", - "name": "FLUX.1 Kontext Pro", - "display_name": "FLUX.1 Kontext Pro", + "id": "alibaba/qwen3.5-plus", + "name": "Qwen 3.5 Plus", + "display_name": "Qwen 3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2025-06", + "release_date": "2026-02-16", + "last_updated": "2026-02-19", + "cost": { + "input": 0.4, + "output": 2.4, + "cache_read": 0.04, + "cache_write": 0.5 + }, "type": "chat" }, { - "id": "bfl/flux-kontext-max", - "name": "FLUX.1 Kontext Max", - "display_name": "FLUX.1 Kontext Max", + "id": "alibaba/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 131072, + "output": 129024 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2025-06", + "release_date": "2025-09-24", + "last_updated": "2026-05-01", + "cost": { + "input": 0.39999999999999997, + "output": 1.5999999999999999 + }, "type": "chat" }, { - "id": "bfl/flux-pro-1.1-ultra", - "name": "FLUX1.1 [pro] Ultra", - "display_name": "FLUX1.1 [pro] Ultra", + "id": "alibaba/qwen3.6-27b", + "name": "Qwen 3.6 27B", + "display_name": "Qwen 3.6 27B", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 256000, + "output": 256000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-11", - "last_updated": "2024-11", + "release_date": "2026-04-22", + "last_updated": "2026-05-01", + "cost": { + "input": 0.6, + "output": 3.5999999999999996 + }, "type": "chat" - } - ] - }, - "minimax": { - "id": "minimax", - "name": "MiniMax (minimax.io)", - "display_name": "MiniMax (minimax.io)", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/guides/quickstart", - "models": [ + }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "alibaba/qwen3-vl-thinking", + "name": "Qwen3 VL Thinking", + "display_name": "Qwen3 VL Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 131072, + "output": 129024 }, "temperature": true, "tool_call": true, @@ -129336,23 +138319,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2025-09", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.7, + "output": 8.4 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "alibaba/qwen-3-235b", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -129362,36 +138352,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 40960, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "alibaba/qwen-3-32b", + "name": "Qwen 3.32B", + "display_name": "Qwen 3.32B", "modalities": { "input": [ "text" @@ -129401,8 +138384,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 40960, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -129410,33 +138393,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "alibaba/qwen3-max-thinking", + "name": "Qwen 3 Max Thinking", + "display_name": "Qwen 3 Max Thinking", "modalities": { "input": [ "text" @@ -129446,8 +138417,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -129468,20 +138439,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-01", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 1.2, + "output": 6, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "alibaba/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -129491,34 +138462,40 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "alibaba/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -129528,8 +138505,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -129537,107 +138514,82 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "open_weights": false, + "release_date": "2025-07-22", + "last_updated": "2026-02-19", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.5, + "output": 1.2 }, "type": "chat" - } - ] - }, - "llmgateway": { - "id": "llmgateway", - "name": "LLM Gateway", - "display_name": "LLM Gateway", - "api": "https://api.llmgateway.io/v1", - "doc": "https://llmgateway.io/docs", - "models": [ + }, { - "id": "gpt-4o-mini-search-preview", - "name": "GPT-4o Mini Search Preview", - "display_name": "GPT-4o Mini Search Preview", + "id": "alibaba/qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast Reasoning", - "display_name": "Grok 4.1 Fast Reasoning", + "id": "alibaba/qwen3-embedding-8b", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.05, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct (2507)", - "display_name": "Qwen3 235B A22B Instruct (2507)", + "id": "alibaba/qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -129647,8 +138599,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, @@ -129656,50 +138608,67 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.38, + "output": 1.53 }, "type": "chat" }, { - "id": "llama-4-scout", - "name": "Llama 4 Scout", - "display_name": "Llama 4 Scout", + "id": "alibaba/qwen3.6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-02", + "last_updated": "2026-04-03", "cost": { - "input": 0.18, - "output": 0.59 + "input": 0.5, + "output": 3, + "cache_read": 0.09999999999999999, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "alibaba/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -129709,28 +138678,41 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "knowledge": "2025-09", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "cost": { - "input": 0.14, - "output": 0.14 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen-coder-plus", - "name": "Qwen Coder Plus", - "display_name": "Qwen Coder Plus", + "id": "alibaba/qwen-3-14b", + "name": "Qwen3-14B", + "display_name": "Qwen3-14B", "modalities": { "input": [ "text" @@ -129740,72 +138722,76 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 40960, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.5, - "output": 1 + "input": 0.06, + "output": 0.24 }, "type": "chat" }, { - "id": "auto", - "name": "Auto Route", - "display_name": "Auto Route", + "id": "alibaba/qwen-3-30b", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 40960, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.08, + "output": 0.29 }, "type": "chat" }, { - "id": "glm-4.6v-flashx", - "name": "GLM-4.6V FlashX", - "display_name": "GLM-4.6V FlashX", + "id": "alibaba/qwen3.5-flash", + "name": "Qwen 3.5 Flash", + "display_name": "Qwen 3.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -129813,52 +138799,66 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.04, + "input": 0.1, "output": 0.4, - "cache_read": 0 + "cache_read": 0.001, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "gemma-2-27b-it-together", - "name": "Gemma 2 27B IT", - "display_name": "Gemma 2 27B IT", + "id": "alibaba/qwen3-vl-instruct", + "name": "Qwen3 VL Instruct", + "display_name": "Qwen3 VL Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 131072, + "output": 129024 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-06-27", - "last_updated": "2024-06-27", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.08, - "output": 0.08 + "input": 0.7, + "output": 2.8 }, "type": "chat" }, { - "id": "codestral-2508", - "name": "Codestral", - "display_name": "Codestral", + "id": "alibaba/qwen3-embedding-4b", + "name": "Qwen3 Embedding 4B", + "display_name": "Qwen3 Embedding 4B", "modalities": { "input": [ "text" @@ -129868,28 +138868,28 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 32768, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "gemma-3-1b-it", - "name": "Gemma 3 1B IT", - "display_name": "Gemma 3 1B IT", + "id": "alibaba/qwen3-coder-30b-a3b", + "name": "Qwen 3 Coder 30B A3B Instruct", + "display_name": "Qwen 3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -129899,28 +138899,30 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 160000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0.07, + "output": 0.27 }, "type": "chat" }, { - "id": "glm-4-32b-0414-128k", - "name": "GLM-4 32B (0414-128k)", - "display_name": "GLM-4 32B (0414-128k)", + "id": "alibaba/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -129930,8 +138932,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -129939,31 +138941,33 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.09, + "output": 1.1 }, "type": "chat" }, { - "id": "seed-1-6-flash-250715", - "name": "Seed 1.6 Flash (250715)", - "display_name": "Seed 1.6 Flash (250715)", + "id": "alibaba/qwen-3.6-max-preview", + "name": "Qwen 3.6 Max Preview", + "display_name": "Qwen 3.6 Max Preview", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 240000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -129973,31 +138977,33 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2026-04-20", + "last_updated": "2026-04-24", "cost": { - "input": 0.07, - "output": 0.3, - "cache_read": 0.01 + "input": 1.3, + "output": 7.8, + "cache_read": 0.26, + "cache_write": 1.625 }, "type": "chat" }, { - "id": "seed-1-6-250615", - "name": "Seed 1.6 (250615)", - "display_name": "Seed 1.6 (250615)", + "id": "alibaba/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 262114, + "output": 262114 }, "temperature": true, "tool_call": true, @@ -130005,33 +139011,77 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 0.3, + "output": 2.9 + }, + "type": "chat" + }, + { + "id": "alibaba/qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 1000000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": true, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "xai/grok-4.20-reasoning", + "name": "Grok 4.20 Reasoning", + "display_name": "Grok 4.20 Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -130039,43 +139089,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": false, + "release_date": "2026-03-09", + "last_updated": "2026-03-23", "cost": { - "input": 0.8, - "output": 2.4 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b-thinking", - "name": "Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen3 VL 30B A3B Thinking", + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -130083,43 +139122,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-02", - "last_updated": "2025-10-02", + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen2-5-vl-32b-instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "xai/grok-4.20-non-reasoning", + "name": "Grok 4.20 Non-Reasoning", + "display_name": "Grok 4.20 Non-Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -130127,51 +139158,53 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-15", - "last_updated": "2025-03-15", + "open_weights": false, + "release_date": "2026-03-09", + "last_updated": "2026-03-23", "cost": { - "input": 0.3, - "output": 0.3 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "qwen3-vl-8b-instruct", - "name": "Qwen3 VL 8B Instruct", - "display_name": "Qwen3 VL 8B Instruct", + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok 4.1 Fast Non-Reasoning", + "display_name": "Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "claude-3-7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "xai/grok-4.20-multi-agent", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ "text" @@ -130181,160 +139214,145 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "release_date": "2026-03-09", + "last_updated": "2026-03-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "gemini-pro-latest", - "name": "Gemini Pro Latest", - "display_name": "Gemini Pro Latest", + "id": "xai/grok-4.20-non-reasoning-beta", + "name": "Grok 4.20 Beta Non-Reasoning", + "display_name": "Grok 4.20 Beta Non-Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-27", - "last_updated": "2026-02-27", + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { "input": 2, - "output": 12, - "cache_read": 0.2 + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "claude-3-5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "xai/grok-imagine-image", + "name": "Grok Imagine Image", + "display_name": "Grok Imagine Image", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 200000, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08 - }, + "release_date": "2026-01-28", + "last_updated": "2026-02-19", "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "xai/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 1000000, + "output": 1000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "release_date": "2026-04-30", + "last_updated": "2026-05-01", "cost": { - "input": 1.6, - "output": 6.4 + "input": 1.25, + "output": 2.5, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "glm-4.6v-flash", - "name": "GLM-4.6V Flash", - "display_name": "GLM-4.6V Flash", + "id": "xai/grok-4.20-reasoning-beta", + "name": "Grok 4.20 Beta Reasoning", + "display_name": "Grok 4.20 Beta Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -130343,50 +139361,48 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct (2507)", - "display_name": "Qwen3 30B A3B Instruct (2507)", + "id": "xai/grok-imagine-image-pro", + "name": "Grok Imagine Image Pro", + "display_name": "Grok Imagine Image Pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", - "cost": { - "input": 0.1, - "output": 0.1 - }, + "open_weights": false, + "release_date": "2026-01-28", + "last_updated": "2026-02-19", "type": "chat" }, { - "id": "minimax-text-01", - "name": "MiniMax Text 01", - "display_name": "MiniMax Text 01", + "id": "xai/grok-4.20-multi-agent-beta", + "name": "Grok 4.20 Multi Agent Beta", + "display_name": "Grok 4.20 Multi Agent Beta", "modalities": { "input": [ "text" @@ -130396,29 +139412,30 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "open_weights": false, + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { - "input": 0.2, - "output": 1.1 + "input": 2, + "output": 6, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "qwen3-32b-fp8", - "name": "Qwen3 32B FP8", - "display_name": "Qwen3 32B FP8", + "id": "xai/grok-4-fast-reasoning", + "name": "Grok 4 Fast Reasoning", + "display_name": "Grok 4 Fast Reasoning", "modalities": { "input": [ "text" @@ -130428,8 +139445,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -130437,20 +139454,27 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "llama-4-scout-17b-instruct", - "name": "Llama 4 Scout 17B Instruct", - "display_name": "Llama 4 Scout 17B Instruct", + "id": "xai/grok-2-vision", + "name": "Grok 2 Vision", + "display_name": "Grok 2 Vision", "modalities": { "input": [ "text", @@ -130462,27 +139486,61 @@ }, "limit": { "context": 8192, - "output": 2048 + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "cost": { + "input": 2, + "output": 10, + "cache_read": 2 + }, + "type": "chat" + }, + { + "id": "interfaze/interfaze-beta", + "name": "Interfaze Beta", + "display_name": "Interfaze Beta", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 32000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-07", + "last_updated": "2026-04-29", "cost": { - "input": 0.17, - "output": 0.66 + "input": 1.5, + "output": 3.5 }, "type": "chat" }, { - "id": "qwen3-4b-fp8", - "name": "Qwen3 4B FP8", - "display_name": "Qwen3 4B FP8", + "id": "meituan/longcat-flash-chat", + "name": "LongCat Flash Chat", + "display_name": "LongCat Flash Chat", "modalities": { "input": [ "text" @@ -130492,137 +139550,118 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", - "cost": { - "input": 0.03, - "output": 0.05 - }, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-30", + "last_updated": "2025-08-30", "type": "chat" }, { - "id": "ministral-8b-2512", - "name": "Ministral 8B", - "display_name": "Ministral 8B", + "id": "meituan/longcat-flash-thinking", + "name": "LongCat Flash Thinking", + "display_name": "LongCat Flash Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 128000, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { "input": 0.15, - "output": 0.15 + "output": 1.5 }, "type": "chat" }, { - "id": "gemma-3-27b", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "meituan/longcat-flash-thinking-2601", + "name": "LongCat Flash Thinking 2601", + "display_name": "LongCat Flash Thinking 2601", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", - "cost": { - "input": 0.27, - "output": 0.27 + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "type": "chat" }, { - "id": "qwen3-vl-flash", - "name": "Qwen3 VL Flash", - "display_name": "Qwen3 VL Flash", + "id": "meta/llama-3.1-70b", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-09", - "last_updated": "2025-10-09", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "llama-3.1-70b-instruct", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "meta/llama-3.1-8b", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -130632,28 +139671,29 @@ ] }, "limit": { - "context": 128000, - "output": 2048 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, + "knowledge": "2023-12", "release_date": "2024-07-23", "last_updated": "2024-07-23", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "seed-1-8-251228", - "name": "Seed 1.8 (251228)", - "display_name": "Seed 1.8 (251228)", + "id": "meta/llama-3.2-90b", + "name": "Llama 3.2 90B Vision Instruct", + "display_name": "Llama 3.2 90B Vision Instruct", "modalities": { "input": [ "text", @@ -130664,30 +139704,29 @@ ] }, "limit": { - "context": 256000, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking (2507)", - "display_name": "Qwen3 235B A22B Thinking (2507)", + "id": "meta/llama-3.2-3b", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -130697,77 +139736,65 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "seed-1-6-250915", - "name": "Seed 1.6 (250915)", - "display_name": "Seed 1.6 (250915)", + "id": "meta/llama-3.2-1b", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 128000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": false, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "glm-4.5-x", - "name": "GLM-4.5 X", - "display_name": "GLM-4.5 X", + "id": "meta/llama-3.2-11b", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -130775,72 +139802,61 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 2.2, - "output": 8.9, - "cache_read": 0.45 + "input": 0.16, + "output": 0.16 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking (2507)", - "display_name": "Qwen3 30B A3B Thinking (2507)", + "id": "meta/llama-4-maverick", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast Reasoning", - "display_name": "Grok 4 Fast Reasoning", + "id": "meta/llama-4-scout", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", "modalities": { "input": [ "text", @@ -130851,39 +139867,32 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "meta/llama-3.3-70b", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -130891,104 +139900,94 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.11 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "ministral-3b-2512", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "xiaomi/mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1050000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "open_weights": false, + "release_date": "2026-04-22", + "last_updated": "2026-05-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 1, + "output": 3, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "knowledge": "2024-10", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.1, + "output": 0.29 }, "type": "chat" }, { - "id": "llama-3.1-nemotron-ultra-253b", - "name": "Llama 3.1 Nemotron Ultra 253B", - "display_name": "Llama 3.1 Nemotron Ultra 253B", + "id": "xiaomi/mimo-v2-pro", + "name": "MiMo V2 Pro", + "display_name": "MiMo V2 Pro", "modalities": { "input": [ "text" @@ -130998,91 +139997,116 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-07", - "last_updated": "2025-04-07", + "open_weights": false, + "release_date": "2026-03-18", + "last_updated": "2026-03-20", "cost": { - "input": 0.6, - "output": 1.8 + "input": 1, + "output": 3, + "cache_read": 0.19999999999999998 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-instruct", - "name": "Llama 4 Maverick 17B Instruct", - "display_name": "Llama 4 Maverick 17B Instruct", + "id": "xiaomi/mimo-v2.5", + "name": "MiMo M2.5", + "display_name": "MiMo M2.5", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1050000, + "output": 131100 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "release_date": "2026-04-22", + "last_updated": "2026-05-01", "cost": { - "input": 0.24, - "output": 0.97 + "input": 0.39999999999999997, + "output": 2, + "cache_read": 0.08 }, "type": "chat" - }, + } + ] + }, + "abliteration-ai": { + "id": "abliteration-ai", + "name": "abliteration.ai", + "display_name": "abliteration.ai", + "api": "https://api.abliteration.ai/v1", + "doc": "https://docs.abliteration.ai/models", + "models": [ { - "id": "grok-4-0709", - "name": "Grok 4 (0709)", - "display_name": "Grok 4 (0709)", + "id": "abliterated-model", + "name": "Abliterated Model", + "display_name": "Abliterated Model", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 150000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "attachment": true, + "open_weights": true, + "release_date": "2026-01-06", + "last_updated": "2026-01-06", "cost": { "input": 3, - "output": 15 + "output": 3 }, "type": "chat" - }, + } + ] + }, + "deepseek": { + "id": "deepseek", + "name": "DeepSeek", + "display_name": "DeepSeek", + "api": "https://api.deepseek.com", + "doc": "https://api-docs.deepseek.com/zh-cn/quick_start/pricing", + "models": [ { - "id": "qwen3-30b-a3b-fp8", - "name": "Qwen3 30B A3B FP8", - "display_name": "Qwen3 30B A3B FP8", + "id": "deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ "text" @@ -131092,29 +140116,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2025-09", + "release_date": "2024-12-26", + "last_updated": "2026-04-24", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "minimax-m2.1-lightning", - "name": "MiniMax M2.1 Lightning", - "display_name": "MiniMax M2.1 Lightning", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -131124,43 +140149,64 @@ ] }, "limit": { - "context": 196608, - "output": 131072 + "context": 1048576, + "output": 393216 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.12, - "output": 0.48 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max (2026-01-23)", - "display_name": "Qwen3 Max (2026-01-23)", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32800 + "context": 1048576, + "output": 393216 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -131169,29 +140215,39 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Compatibility alias for deepseek-v4-flash thinking mode." ] } }, "attachment": true, - "open_weights": false, - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-01-20", + "last_updated": "2026-04-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.6 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -131201,28 +140257,59 @@ ] }, "limit": { - "context": 32768, - "output": 32000 + "context": 1048576, + "output": 393216 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.03, - "output": 0.05 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" - }, + } + ] + }, + "perplexity": { + "id": "perplexity", + "name": "Perplexity", + "display_name": "Perplexity", + "doc": "https://docs.perplexity.ai", + "models": [ { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ "text" @@ -131232,33 +140319,32 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.8, - "output": 4 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "gpt-4o-search-preview", - "name": "GPT-4o Search Preview", - "display_name": "GPT-4o Search Preview", + "id": "sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "display_name": "Perplexity Sonar Deep Research", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -131266,27 +140352,30 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "knowledge": "2025-01", + "release_date": "2025-02-01", + "last_updated": "2025-09-01", "cost": { - "input": 2.5, - "output": 10 + "input": 2, + "output": 8, + "reasoning": 3 }, "type": "chat" }, { - "id": "custom", - "name": "Custom Model", - "display_name": "Custom Model", + "id": "sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ "text", @@ -131298,27 +140387,29 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, + "knowledge": "2025-09-01", "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b-instruct", - "name": "Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen3 VL 30B A3B Instruct", + "id": "sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ "text", @@ -131329,67 +140420,81 @@ ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-02", - "last_updated": "2025-10-02", + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 3, + "output": 15 }, "type": "chat" - }, + } + ] + }, + "iflowcn": { + "id": "iflowcn", + "name": "iFlow", + "display_name": "iFlow", + "api": "https://apis.iflow.cn/v1", + "doc": "https://platform.iflow.cn/en/docs", + "models": [ { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "qwen3-max-preview", + "name": "Qwen3-Max-Preview", + "display_name": "Qwen3-Max-Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 16384 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-fp8", - "name": "Qwen3 235B A22B FP8", - "display_name": "Qwen3 235B A22B FP8", + "id": "kimi-k2-0905", + "name": "Kimi-K2-0905", + "display_name": "Kimi-K2-0905", "modalities": { "input": [ "text" @@ -131399,66 +140504,73 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.5, - "output": 2.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen3-vl-plus", + "name": "Qwen3-VL-Plus", + "display_name": "Qwen3-VL-Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32766 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "qwen3-235b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ "text" @@ -131468,92 +140580,30 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", - "cost": { - "input": 1, - "output": 3, - "cache_read": 0.5 - }, - "type": "chat" - }, - { - "id": "llama-3-8b-instruct", - "name": "Llama 3 8B Instruct", - "display_name": "Llama 3 8B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", - "cost": { - "input": 0.04, - "output": 0.04 - }, - "type": "chat" - }, - { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -131563,8 +140613,8 @@ ] }, "limit": { - "context": 131072, - "output": 32766 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -131574,23 +140624,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.15, - "output": 0.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen25-coder-7b", - "name": "Qwen2.5 Coder 7B", - "display_name": "Qwen2.5 Coder 7B", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2-Exp", + "display_name": "DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -131600,28 +140657,34 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.05, - "output": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "deepseek-v3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ "text" @@ -131632,7 +140695,7 @@ }, "limit": { "context": 128000, - "output": 2048 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -131641,18 +140704,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-10", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 0.22, - "output": 0.22 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3-70b-instruct", - "name": "Llama 3 70B Instruct", - "display_name": "Llama 3 70B Instruct", + "id": "qwen3-max", + "name": "Qwen3-Max", + "display_name": "Qwen3-Max", "modalities": { "input": [ "text" @@ -131662,28 +140726,40 @@ ] }, "limit": { - "context": 8192, - "output": 8000 + "context": 256000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.51, - "output": 0.74 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 (0528)", - "display_name": "DeepSeek R1 (0528)", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -131693,40 +140769,35 @@ ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 200000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2025-11-13", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.5-airx", - "name": "GLM-4.5 AirX", - "display_name": "GLM-4.5 AirX", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -131737,60 +140808,83 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 1.1, - "output": 4.5, - "cache_read": 0.22 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "ministral-14b-2512", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3-235B-A22B-Thinking", + "display_name": "Qwen3-235B-A22B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 256000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.2-11b-instruct", - "name": "Llama 3.2 11B Instruct", - "display_name": "Llama 3.2 11B Instruct", + "id": "kimi-k2", + "name": "Kimi-K2", + "display_name": "Kimi-K2", "modalities": { "input": [ "text" @@ -131801,60 +140895,60 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.07, - "output": 0.33 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-opus", - "name": "Claude 3 Opus", - "display_name": "Claude 3 Opus", + "id": "qwen3-coder-plus", + "name": "Qwen3-Coder-Plus", + "display_name": "Qwen3-Coder-Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimax-m2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "qwen3-235b-a22b-instruct", + "name": "Qwen3-235B-A22B-Instruct", + "display_name": "Qwen3-235B-A22B-Instruct", "modalities": { "input": [ "text" @@ -131864,80 +140958,69 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "stackit": { + "id": "stackit", + "name": "STACKIT", + "display_name": "STACKIT", + "api": "https://api.openai-compat.model-serving.eu01.onstackit.cloud/v1", + "doc": "https://docs.stackit.cloud/products/data-and-ai/ai-model-serving/basics/available-shared-models", + "models": [ { - "id": "grok-4-20-beta-0309-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 0.16, + "output": 0.27 }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "neuralmagic/Mistral-Nemo-Instruct-2407-FP8", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -131947,8 +141030,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -131957,74 +141040,60 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 1, - "output": 5 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "cortecs/Llama-3.3-70B-Instruct-FP8-Dynamic", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -132032,138 +141101,100 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 37000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "open_weights": true, + "release_date": "2025-05-17", + "last_updated": "2025-05-17", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "intfloat/e5-mistral-7b-instruct", + "name": "E5 Mistral 7B", + "display_name": "E5 Mistral 7B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 4096, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", + "name": "Qwen3-VL 235B", + "display_name": "Qwen3-VL 235B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 218000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -132172,19 +141203,18 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0, - "output": 0 + "input": 1.64, + "output": 1.91 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "Qwen/Qwen3-VL-Embedding-8B", + "name": "Qwen3-VL Embedding 8B", + "display_name": "Qwen3-VL Embedding 8B", "modalities": { "input": [ "text", @@ -132195,42 +141225,51 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.09, + "output": 0.09 }, "type": "chat" - }, + } + ] + }, + "evroc": { + "id": "evroc", + "name": "evroc", + "display_name": "evroc", + "api": "https://models.think.evroc.com/v1", + "doc": "https://docs.evroc.com/products/think/overview.html", + "models": [ { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -132249,66 +141288,49 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 1.47, + "output": 5.9 }, "type": "chat" }, { - "id": "minimax-m2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "openai/whisper-large-v3", + "name": "Whisper 3 Large", + "display_name": "Whisper 3 Large", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 448, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -132318,10 +141340,9 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 65536, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -132329,158 +141350,116 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.24, + "output": 0.94 }, "type": "chat" }, { - "id": "gemma-3n-e4b-it", - "name": "Gemma 3n 4B", - "display_name": "Gemma 3n 4B", + "id": "KBLab/kb-whisper-large", + "name": "KB Whisper", + "display_name": "KB Whisper", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2000 + "context": 448, + "output": 448 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0, - "output": 0 + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "nvidia/Llama-3.3-70B-Instruct-FP8", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.18, + "output": 1.18 }, "type": "chat" }, { - "id": "gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "mistralai/Voxtral-Small-24B-2507", + "name": "Voxtral Small 24B", + "display_name": "Voxtral Small 24B", "modalities": { "input": [ - "text", - "image" + "audio", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 32000 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 21, - "output": 168 + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "mistralai/devstral-small-2-24b-instruct-2512", + "name": "Devstral Small 2 24B Instruct 2512", + "display_name": "Devstral Small 2 24B Instruct 2512", "modalities": { "input": [ "text" @@ -132490,85 +141469,57 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.12, + "output": 0.47 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "mistralai/Magistral-Small-2509", + "name": "Magistral Small 1.2 24B", + "display_name": "Magistral Small 1.2 24B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.59, + "output": 2.36 }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "microsoft/Phi-4-multimodal-instruct", + "name": "Phi-4 15B", + "display_name": "Phi-4 15B", "modalities": { "input": [ "text", @@ -132579,29 +141530,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.21, - "output": 0.63 + "input": 0.24, + "output": 0.47 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "intfloat/multilingual-e5-large-instruct", + "name": "E5 Multi-Lingual Large Embeddings 0.6B", + "display_name": "E5 Multi-Lingual Large Embeddings 0.6B", "modalities": { "input": [ "text" @@ -132611,74 +141560,59 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 512, + "output": 512 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "input": 0.12, + "output": 0.12 }, "type": "chat" }, { - "id": "devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen3 VL 30B", + "display_name": "Qwen3 VL 30B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 100000, + "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.4, - "output": 2 + "input": 0.24, + "output": 0.94 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", + "name": "Qwen3 30B 2507", + "display_name": "Qwen3 30B 2507", "modalities": { "input": [ "text" @@ -132688,116 +141622,80 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 64000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 0.35, + "output": 1.42 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 40960, + "output": 40960 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.12, + "output": 0.12 }, - "type": "chat" - }, + "type": "embedding" + } + ] + }, + "nova": { + "id": "nova", + "name": "Nova", + "display_name": "Nova", + "api": "https://api.nova.amazon.com/v1", + "doc": "https://nova.amazon.com/dev/documentation", + "models": [ { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "nova-2-pro-v1", + "name": "Nova 2 Pro", + "display_name": "Nova 2 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -132805,29 +141703,26 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", - "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "attachment": true, + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2026-01-03", + "cost": { + "input": 0, + "output": 0, + "reasoning": 0 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "nova-2-lite-v1", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", "image", "video", - "audio", "pdf" ], "output": [ @@ -132835,8 +141730,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -132844,58 +141739,40 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0, + "output": 0, + "reasoning": 0 }, "type": "chat" - }, + } + ] + }, + "venice": { + "id": "venice", + "name": "Venice AI", + "display_name": "Venice AI", + "doc": "https://docs.venice.ai", + "models": [ { - "id": "qwen35-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "z-ai-glm-5-turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -132903,20 +141780,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "release_date": "2026-03-15", + "last_updated": "2026-04-12", "cost": { - "input": 0.6, - "output": 3.6 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "hermes-3-llama-3.1-405b", + "name": "Hermes 3 Llama 3.1 405b", + "display_name": "Hermes 3 Llama 3.1 405b", "modalities": { "input": [ "text" @@ -132926,29 +141804,29 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, + "open_weights": true, "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "release_date": "2025-09-25", + "last_updated": "2026-03-12", "cost": { - "input": 1.6, - "output": 6.4 + "input": 1.1, + "output": 3 }, "type": "chat" }, { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat (latest)", - "display_name": "GPT-5.3 Chat (latest)", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3 VL 235B", + "display_name": "Qwen3 VL 235B", "modalities": { "input": [ "text", @@ -132959,45 +141837,51 @@ ] }, "limit": { - "context": 128000, + "context": 256000, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "open_weights": true, + "release_date": "2026-01-16", + "last_updated": "2026-03-12", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.25, + "output": 1.5 }, "type": "chat" }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "google-gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "display_name": "Google Gemma 3 27B Instruct", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 198000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -133005,36 +141889,32 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-11-04", + "last_updated": "2026-03-12", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.12, + "output": 0.2 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -133042,46 +141922,37 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-04-18", + "last_updated": "2026-05-04", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, + "tiers": [ + { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, + "tier": { + "type": "context", + "size": 200000 + } + } + ], "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 } }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -133112,36 +141983,33 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-04-29", "cost": { - "input": 0.4, - "output": 1.2, - "reasoning": 4 + "input": 1.73, + "output": 3.796, + "cache_read": 0.33 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "zai-org-glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 198000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -133150,59 +142018,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-03-12", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "qwen3.6-35b-a3b", - "name": "Qwen3.6 35B-A3B", - "display_name": "Qwen3.6 35B-A3B", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 160000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -133212,128 +142061,90 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2025-10", + "release_date": "2025-12-04", + "last_updated": "2026-03-24", "cost": { - "input": 0.248, - "output": 1.485 + "input": 0.33, + "output": 0.48, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "mistral-small-2603", + "name": "Mistral Small 4", + "display_name": "Mistral Small 4", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "attachment": true, + "open_weights": true, + "release_date": "2026-03-16", + "last_updated": "2026-04-09", "cost": { - "input": 0.07, - "output": 0.27, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 0.1875, + "output": 0.75 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "zai-org-glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-03-12", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -133344,10 +142155,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 198000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -133355,55 +142166,38 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-01-15", + "last_updated": "2026-04-12", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 3.75, + "output": 18.75, + "cache_read": 0.375, + "cache_write": 4.69 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "arcee-trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -133412,146 +142206,96 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-04", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.3125, + "output": 1.125, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "venice-uncensored-1-2", + "name": "Venice Uncensored 1.2", + "display_name": "Venice Uncensored 1.2", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-19", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.2, + "output": 0.9 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "grok-41-fast", + "name": "Grok 4.1 Fast", + "display_name": "Grok 4.1 Fast", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2025-07", + "release_date": "2025-12-01", + "last_updated": "2026-04-09", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.23, + "output": 0.57, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "minimax-m27", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ "text" @@ -133561,8 +142305,8 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 198000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -133570,38 +142314,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "open_weights": false, + "release_date": "2026-03-18", + "last_updated": "2026-04-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.375, + "output": 1.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "openai-gpt-55", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -133611,21 +142350,35 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-04-23", + "last_updated": "2026-04-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 6.25, + "output": 37.5, + "cache_read": 0.625, + "tiers": [ + { + "input": 12.5, + "output": 56.25, + "cache_read": 1.25, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 12.5, + "output": 56.25, + "cache_read": 1.25 + } }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "nvidia-nemotron-cascade-2-30b-a3b", + "name": "Nemotron Cascade 2 30B A3B", + "display_name": "Nemotron Cascade 2 30B A3B", "modalities": { "input": [ "text" @@ -133635,7 +142388,7 @@ ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 32768 }, "temperature": true, @@ -133644,36 +142397,54 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2026-03-24", + "last_updated": "2026-04-09", + "cost": { + "input": 0.14, + "output": 0.8 + }, + "type": "chat" + }, + { + "id": "mistral-small-3-2-24b-instruct", + "name": "Mistral Small 3.2 24B Instruct", + "display_name": "Mistral Small 3.2 24B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "release_date": "2026-01-15", + "last_updated": "2026-03-16", "cost": { - "input": 0.05, - "output": 0.4 + "input": 0.09375, + "output": 0.25 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "nvidia-nemotron-3-nano-30b-a3b", + "name": "NVIDIA Nemotron 3 Nano 30B", + "display_name": "NVIDIA Nemotron 3 Nano 30B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -133681,104 +142452,71 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-03-12", "cost": { - "input": 10, - "output": 30 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "openai-gpt-4o-mini-2024-07-18", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2026-02-28", + "last_updated": "2026-03-06", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.1875, + "output": 0.75, + "cache_read": 0.09375 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "zai-org-glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 198000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -133797,61 +142535,87 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2024-04-01", + "last_updated": "2026-04-04", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 0.85, + "output": 2.75, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "llama-3.2-3b", + "name": "Llama 3.2 3B", + "display_name": "Llama 3.2 3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-10-03", + "last_updated": "2026-03-12", + "cost": { + "input": 0.15, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "openai-gpt-52", + "name": "GPT-5.2", + "display_name": "GPT-5.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-08-31", + "release_date": "2025-12-13", + "last_updated": "2026-03-12", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "gemma-4-uncensored", + "name": "Gemma 4 Uncensored", + "display_name": "Gemma 4 Uncensored", "modalities": { "input": [ "text", @@ -133862,29 +142626,72 @@ ] }, "limit": { - "context": 200000, + "context": 256000, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, + "open_weights": true, + "release_date": "2026-04-13", + "last_updated": "2026-04-19", + "cost": { + "input": 0.1625, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "minimax-m25", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 198000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "release_date": "2026-02-12", + "last_updated": "2026-04-12", "cost": { - "input": 3, - "output": 15 + "input": 0.34, + "output": 1.19, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "pixtral-large-latest", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "openai-gpt-55-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ "text", @@ -133895,29 +142702,29 @@ ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-04-25", "cost": { - "input": 2, - "output": 6 + "input": 37.5, + "output": 225 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", @@ -133928,10 +142735,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -133941,40 +142748,45 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-02-17", + "last_updated": "2026-03-16", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3.6, + "output": 18, + "cache_read": 0.36, + "cache_write": 4.5 }, "type": "chat" }, { - "id": "grok-4-20-beta-0309-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "kimi-k2-6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -133985,8 +142797,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -133994,31 +142806,35 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "open_weights": true, + "release_date": "2026-04-20", + "last_updated": "2026-04-30", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 12, - "cache_read": 0.4 - } + "input": 0.85, + "output": 4.655, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "llama-3.3-70b", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -134026,34 +142842,32 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-06", + "last_updated": "2026-03-12", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.7, + "output": 2.8 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "claude-opus-4-6-fast", + "name": "Claude Opus 4.6 Fast", + "display_name": "Claude Opus 4.6 Fast", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" @@ -134061,153 +142875,188 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-05-31", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.276, - "output": 1.651, - "cache_read": 0.028, - "cache_write": 0.344 + "input": 36, + "output": 180, + "cache_read": 3.6, + "cache_write": 45 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "qwen3-5-35b-a3b", + "name": "Qwen 3.5 35B A3B", + "display_name": "Qwen 3.5 35B A3B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "open_weights": true, + "release_date": "2026-02-25", + "last_updated": "2026-04-16", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.3125, + "output": 1.25, + "cache_read": 0.15625 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "qwen3-5-397b-a17b", + "name": "Qwen 3.5 397B", + "display_name": "Qwen 3.5 397B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "release_date": "2026-02-16", + "last_updated": "2026-04-16", + "cost": { + "input": 0.75, + "output": 4.5 }, - "attachment": false, + "type": "chat" + }, + { + "id": "grok-4-20-multi-agent", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000000, + "output": 128000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2026-03-12", + "last_updated": "2026-05-07", "cost": { - "input": 1.2, - "output": 6 + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, + "tiers": [ + { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 + } }, "type": "chat" }, { - "id": "minimax-m2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "openai-gpt-54-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -134215,25 +143064,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-31", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.9375, + "output": 5.625, + "cache_read": 0.09375 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "olafangensan-glm-4.7-flash-heretic", + "name": "GLM 4.7 Flash Heretic", + "display_name": "GLM 4.7 Flash Heretic", "modalities": { "input": [ "text" @@ -134244,7 +143089,7 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 24000 }, "temperature": true, "tool_call": true, @@ -134252,33 +143097,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": true, + "release_date": "2026-02-04", + "last_updated": "2026-03-12", "cost": { - "input": 6, - "output": 24, - "cache_read": 1.3, - "cache_write": 0 + "input": 0.14, + "output": 0.8 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "grok-4-20", + "name": "Grok 4.20", + "display_name": "Grok 4.20", "modalities": { "input": [ "text", @@ -134289,45 +143121,46 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 2000000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2026-03-12", + "last_updated": "2026-05-07", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, + "tiers": [ + { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 + } }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -134338,7 +143171,7 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, @@ -134352,50 +143185,54 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", "xhigh" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "qwen-3-6-plus", + "name": "Qwen 3.6 Plus Uncensored", + "display_name": "Qwen 3.6 Plus Uncensored", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -134403,23 +143240,40 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-06", + "last_updated": "2026-04-12", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.625, + "output": 3.75, + "cache_read": 0.0625, + "cache_write": 0.78, + "tiers": [ + { + "input": 2.5, + "output": 7.5, + "cache_read": 0.0625, + "cache_write": 0.78, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 7.5, + "cache_read": 0.0625, + "cache_write": 0.78 + } }, "type": "chat" }, { - "id": "mistral-large-latest", - "name": "Mistral Large (latest)", - "display_name": "Mistral Large (latest)", + "id": "openai-gpt-54-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", @@ -134430,99 +143284,125 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "open_weights": false, + "release_date": "2026-03-05", + "last_updated": "2026-03-09", "cost": { - "input": 0.5, - "output": 1.5 + "input": 37.5, + "output": 225, + "tiers": [ + { + "input": 75, + "output": 337.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 75, + "output": 337.5 + } }, "type": "chat" }, { - "id": "mistral-small-2506", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "release_date": "2026-04-24", + "last_updated": "2026-04-29", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.17, + "output": 0.35, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "gemma-3-12b-it", - "name": "Gemma 3 12B", - "display_name": "Gemma 3 12B", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen 3 235B A22B Instruct 2507", + "display_name": "Qwen 3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.75 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -134530,10 +143410,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -134543,53 +143423,50 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-01", + "release_date": "2025-12-19", + "last_updated": "2026-03-12", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.7, + "output": 3.75, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "qwen3-6-27b", + "name": "Qwen 3.6 27B", + "display_name": "Qwen 3.6 27B", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 256000, "output": 65536 }, "temperature": true, @@ -134598,43 +143475,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-29", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.325, + "output": 3.25 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "qwen3-5-9b", + "name": "Qwen 3.5 9B", + "display_name": "Qwen 3.5 9B", "modalities": { "input": [ "text", @@ -134645,31 +143499,29 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "release_date": "2026-03-05", + "last_updated": "2026-04-19", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.1, + "output": 0.15 }, "type": "chat" }, { - "id": "gemma-3n-e2b-it", - "name": "Gemma 3n 2B", - "display_name": "Gemma 3n 2B", + "id": "qwen3-coder-480b-a35b-instruct-turbo", + "name": "Qwen 3 Coder 480B Turbo", + "display_name": "Qwen 3 Coder 480B Turbo", "modalities": { "input": [ "text" @@ -134679,29 +143531,29 @@ ] }, "limit": { - "context": 8192, - "output": 2000 + "context": 256000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2026-01-27", + "last_updated": "2026-02-26", "cost": { - "input": 0, - "output": 0 + "input": 0.35, + "output": 1.5, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "claude-opus-4-7-fast", + "name": "Claude Opus 4.7 Fast", + "display_name": "Claude Opus 4.7 Fast", "modalities": { "input": [ "text", @@ -134712,10 +143564,10 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -134726,38 +143578,41 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "xhigh" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-05-14", + "last_updated": "2026-05-14", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 36, + "output": 180, + "cache_read": 3.6, + "cache_write": 45 }, "type": "chat" }, { - "id": "grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "openai-gpt-52-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", @@ -134768,8 +143623,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -134779,35 +143634,31 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-08", + "release_date": "2025-01-15", + "last_updated": "2026-03-12", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen 3 235B A22B Thinking 2507", + "display_name": "Qwen 3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -134817,37 +143668,43 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-03-12", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.45, + "output": 3.5 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3-Next 80B-A3B (Thinking)", - "display_name": "Qwen3-Next 80B-A3B (Thinking)", + "id": "google-gemma-4-26b-a4b-it", + "name": "Google Gemma 4 26B A4B Instruct", + "display_name": "Google Gemma 4 26B A4B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -134855,43 +143712,64 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "release_date": "2026-04-02", + "last_updated": "2026-04-12", "cost": { - "input": 0.5, - "output": 6 + "input": 0.1625, + "output": 0.5 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "openai-gpt-4o-2024-11-20", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-28", + "last_updated": "2026-03-06", + "cost": { + "input": 3.125, + "output": 12.5 + }, + "type": "chat" + }, + { + "id": "openai-gpt-54", + "name": "GPT-5.4", + "display_name": "GPT-5.4", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -134899,27 +143777,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2026-03-05", + "last_updated": "2026-03-09", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 3.13, + "output": 18.8, + "cache_read": 0.313 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", @@ -134930,10 +143802,10 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -134943,39 +143815,45 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", "effort_options": [ - "none", "low", "medium", "high" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "gemma-3-4b-it", - "name": "Gemma 3 4B", - "display_name": "Gemma 3 4B", + "id": "venice-uncensored-role-play", + "name": "Venice Role Play Uncensored", + "display_name": "Venice Role Play Uncensored", "modalities": { "input": [ "text", @@ -134986,29 +143864,28 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2026-02-20", + "last_updated": "2026-03-16", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "zai-org-glm-5-1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -135018,8 +143895,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 24000 }, "temperature": true, "tool_call": true, @@ -135040,35 +143917,32 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2026-04-07", + "last_updated": "2026-04-08", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 1.75, + "output": 5.5, + "cache_read": 0.325 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "zai-org-glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 198000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -135077,44 +143951,44 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-24", + "last_updated": "2026-03-12", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.55, + "output": 2.65, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "gemini-3-1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -135122,23 +143996,38 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-19", + "last_updated": "2026-03-12", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 2.5, + "output": 15, + "cache_read": 0.5, + "cache_write": 0.5, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "kimi-k2-5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -135149,10 +144038,10 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 256000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -135161,38 +144050,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-04", + "release_date": "2026-01-27", + "last_updated": "2026-04-30", "cost": { - "input": 30, - "output": 180 + "input": 0.56, + "output": 3.5, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "aion-labs-aion-2-0", + "name": "Aion 2.0", + "display_name": "Aion 2.0", "modalities": { "input": [ "text" @@ -135202,30 +144083,30 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "release_date": "2026-03-24", + "last_updated": "2026-04-12", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 + "input": 1, + "output": 2, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "qwen3-next-80b", + "name": "Qwen 3 Next 80b", + "display_name": "Qwen 3 Next 80b", "modalities": { "input": [ "text" @@ -135235,45 +144116,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-03-12", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.35, + "output": 1.9 }, "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "z-ai-glm-5v-turbo", + "name": "GLM 5V Turbo", + "display_name": "GLM 5V Turbo", "modalities": { "input": [ "text", @@ -135284,29 +144149,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "release_date": "2026-04-01", + "last_updated": "2026-04-12", "cost": { - "input": 0.8, - "output": 3.2 + "input": 1.5, + "output": 5, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "openai-gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ "text" @@ -135317,28 +144183,69 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-11-06", + "last_updated": "2026-05-06", + "cost": { + "input": 0.07, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 198000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "release_date": "2025-12-06", + "last_updated": "2026-04-12", "cost": { - "input": 1, - "output": 1 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ "text" @@ -135348,29 +144255,30 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 50000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-02-20", + "last_updated": "2026-04-09", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.3125, + "output": 0.9375, + "cache_read": 0.03125 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "openai-gpt-53-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", @@ -135381,8 +144289,8 @@ ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -135392,24 +144300,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "release_date": "2026-02-24", + "last_updated": "2026-03-12", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "google-gemma-4-31b-it", + "name": "Google Gemma 4 31B Instruct", + "display_name": "Google Gemma 4 31B Instruct", "modalities": { "input": [ "text", @@ -135421,8 +144324,8 @@ ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -135432,19 +144335,27 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "release_date": "2026-04-03", + "last_updated": "2026-04-12", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0.175, + "output": 0.5 }, "type": "chat" - }, + } + ] + }, + "fireworks-ai": { + "id": "fireworks-ai", + "name": "Fireworks AI", + "display_name": "Fireworks AI", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://fireworks.ai/docs/", + "models": [ { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "accounts/fireworks/models/minimax-m2p7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -135454,8 +144365,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -135476,20 +144387,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-04-12", + "last_updated": "2026-04-12", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "accounts/fireworks/models/glm-4p7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -135499,8 +144409,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 198000, + "output": 198000 }, "temperature": true, "tool_call": true, @@ -135510,58 +144420,65 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 0.6, + "output": 2.2, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3-Next 80B-A3B Instruct", - "display_name": "Qwen3-Next 80B-A3B Instruct", + "id": "accounts/fireworks/models/qwen3p6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-04", + "last_updated": "2026-04-04", "cost": { "input": 0.5, - "output": 2 + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "accounts/fireworks/models/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -135571,40 +144488,41 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 30, - "output": 60 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "accounts/fireworks/models/kimi-k2p6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -135614,39 +144532,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "accounts/fireworks/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -135656,44 +144576,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "accounts/fireworks/models/deepseek-v3p2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 160000, + "output": 160000 }, "temperature": true, "tool_call": true, @@ -135701,34 +144611,44 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.56, + "output": 1.68, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "accounts/fireworks/models/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -135736,94 +144656,87 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.6, + "output": 2.5, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "accounts/fireworks/models/glm-4p5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "accounts/fireworks/models/minimax-m2p5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, @@ -135831,34 +144744,45 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "accounts/fireworks/models/kimi-k2p5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -135866,35 +144790,44 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3-VL Plus", - "display_name": "Qwen3-VL Plus", + "id": "accounts/fireworks/models/minimax-m2p1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, @@ -135914,33 +144847,31 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.2, - "output": 1.6, - "reasoning": 4.8 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "grok-4-1-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "accounts/fireworks/models/deepseek-v3p1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -135948,35 +144879,32 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "accounts/fireworks/models/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -135984,23 +144912,25 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "accounts/fireworks/models/glm-4p5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -136010,92 +144940,74 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "accounts/fireworks/models/glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1, + "output": 3.2, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "accounts/fireworks/models/glm-5p1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -136105,8 +145017,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 202800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -136127,20 +145039,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "accounts/fireworks/routers/kimi-k2p5-turbo", + "name": "Kimi K2.5 Turbo", + "display_name": "Kimi K2.5 Turbo", "modalities": { "input": [ "text", @@ -136151,87 +145062,96 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "accounts/fireworks/models/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.74, + "output": 3.48, + "cache_read": 0.15 }, "type": "chat" - }, + } + ] + }, + "alibaba": { + "id": "alibaba", + "name": "alibaba", + "display_name": "alibaba", + "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", + "models": [ { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -136241,8 +145161,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -136251,69 +145171,103 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.45, - "output": 2.25 + "input": 0.175, + "output": 0.7 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "qwen3-livetranslate-flash-realtime", + "name": "Qwen3-LiveTranslate Flash Realtime", + "display_name": "Qwen3-LiveTranslate Flash Realtime", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 53248, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "cost": { + "input": 10, + "output": 10, + "input_audio": 10, + "output_audio": 38 + }, + "type": "chat" + }, + { + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 2.8, + "output": 8.4 }, "type": "chat" }, - { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + { + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -136334,75 +145288,71 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.4, + "output": 2.4, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "qwen3-vl-plus", + "name": "Qwen3 VL Plus", + "display_name": "Qwen3 VL Plus", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.2, + "output": 1.6, + "reasoning": 4.8 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "display_name": "Qwen3-VL 235B-A22B", "modalities": { "input": [ "text", @@ -136413,10 +145363,10 @@ ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -136425,79 +145375,44 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 15, - "output": 120 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "qwen3.6-27b", + "name": "Qwen3.6 27B", + "display_name": "Qwen3.6 27B", "modalities": { "input": [ "text", "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" - }, - { - "id": "minimax-m2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", - "modalities": { - "input": [ - "text" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -136507,25 +145422,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "output": 3.6 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ "text" @@ -136535,14 +145454,19 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } }, "extra_capabilities": { "reasoning": { @@ -136555,177 +145479,166 @@ ] } }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, "attachment": false, "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-04-28", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.05, - "output": 0.2, - "reasoning": 0.5 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "qwen3-8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.18, + "output": 0.7, + "reasoning": 2.1 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text", "image", - "audio", "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.4, + "output": 3.2 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "qwen3-235b-a22b", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ "text" @@ -136735,40 +145648,53 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -136795,22 +145721,20 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ "text" @@ -136820,14 +145744,19 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -136840,201 +145769,152 @@ ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", - "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.13, - "cache_write": 1.625 - }, - "type": "chat" - }, - { - "id": "gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.25, - "output": 10 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "display_name": "Qwen-Omni Turbo Realtime", "modalities": { "input": [ "text", "image", - "pdf" + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.27, + "output": 1.07, + "input_audio": 4.44, + "output_audio": 8.89 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "qwen-mt-turbo", + "name": "Qwen Mt Turbo", + "display_name": "Qwen Mt Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 16384, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 2.8, - "output": 8.4 + "input": 0.16, + "output": 0.49 }, "type": "chat" }, { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", - "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 } }, - "type": "chat" - }, - { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-11-01", + "last_updated": "2025-04-28", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.05, + "output": 0.2, + "reasoning": 0.5 }, "type": "chat" }, { - "id": "devstral-small-2507", - "name": "Devstral Small", - "display_name": "Devstral Small", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ "text" @@ -137044,88 +145924,78 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0.1, - "output": 0.3 + "input": 1.6, + "output": 6.4 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "display_name": "Qwen2.5-VL 7B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.35, + "output": 1.05 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "display_name": "Qwen2.5 32B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 8192 }, "temperature": true, @@ -137133,112 +146003,119 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.7, + "output": 2.8 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "display_name": "Qwen3-ASR Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 53248, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.035, + "output": 0.035 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, "type": "chat" }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -137248,8 +146125,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -137258,303 +146135,280 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 2, - "output": 8 + "input": 0.5, + "output": 6 }, "type": "chat" - } - ] - }, - "google-vertex": { - "id": "google-vertex", - "name": "Vertex", - "display_name": "Vertex", - "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", - "models": [ + }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "qwen-mt-plus", + "name": "Qwen Mt Plus", + "display_name": "Qwen Mt Plus", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 16384, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.025 + "input": 2.46, + "output": 7.37 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.21, + "output": 0.63 }, "type": "chat" }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", "modalities": { "input": [ "text", "image", "audio", - "video", - "pdf" + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.07, + "output": 0.27, + "input_audio": 4.44, + "output_audio": 8.89 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "id": "qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "display_name": "Qwen3-VL 30B-A3B", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.2, + "output": 0.8, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "qwen3.5-35b-a3b", + "name": "Qwen3.5 35B-A3B", + "display_name": "Qwen3.5 35B-A3B", "modalities": { "input": [ "text", "image", - "audio", "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -137566,54 +146420,74 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", + "cost": { + "input": 0.25, + "output": 2 + }, + "type": "chat" + }, + { + "id": "qwen-vl-ocr", + "name": "Qwen Vl Ocr", + "display_name": "Qwen Vl Ocr", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 34096, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09-25", - "display_name": "Gemini 2.5 Flash Preview 09-25", + "id": "qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ "text", "image", - "audio", "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -137625,51 +146499,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.248, + "output": 1.485 }, "type": "chat" }, { - "id": "zai-org/glm-5-maas", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "display_name": "Qwen3-Omni Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -137689,135 +146555,122 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.1 + "input": 0.43, + "output": 1.66, + "input_audio": 3.81, + "output_audio": 15.11 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-maas", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "display_name": "Qwen2.5 14B Instruct", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-06", - "last_updated": "2026-01-06", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.35, + "output": 1.4 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-maas", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-17", - "last_updated": "2026-04-04", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.056 + "input": 1.4, + "output": 5.6 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.1-maas", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.6, - "output": 1.7 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b-maas", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qvq-max", + "name": "QVQ Max", + "display_name": "QVQ Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -137825,7 +146678,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -137834,19 +146687,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.09, - "output": 0.36 + "input": 1.2, + "output": 4.8 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b-maas", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -137856,8 +146710,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -137865,20 +146719,34 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.07, - "output": 0.25 + "input": 1.3, + "output": 7.8, + "cache_read": 0.13, + "cache_write": 1.625 }, "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct-maas", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ "text" @@ -137888,8 +146756,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -137898,52 +146766,57 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.45, + "output": 2.25 }, "type": "chat" }, { - "id": "meta/llama-4-maverick-17b-128e-instruct-maas", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "id": "qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "display_name": "Qwen3-Omni Flash Realtime", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 524288, - "output": 8192 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.35, - "output": 1.15 + "input": 0.52, + "output": 1.99, + "input_audio": 4.57, + "output_audio": 18.13 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507-maas", - "name": "Qwen3 235B A22B Instruct", - "display_name": "Qwen3 235B A22B Instruct", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -137953,32 +146826,35 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-maas", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" @@ -137986,7 +146862,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -138005,781 +146881,563 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.3, + "output": 2.4 }, "type": "chat" }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.8, + "output": 3.2 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "display_name": "Gemini 2.5 Pro Preview 05-06", + "id": "qwen-plus-character-ja", + "name": "Qwen Plus Character (Japanese)", + "display_name": "Qwen Plus Character (Japanese)", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 512 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.5, + "output": 1.4 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "display_name": "Qwen2.5-Omni 7B", "modalities": { "input": [ "text", "image", - "video", "audio", - "pdf" + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.1, + "output": 0.4, + "input_audio": 6.76 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.4, + "output": 1.2, + "reasoning": 4 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "qwen3-14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.35, + "output": 1.4, + "reasoning": 4.2 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "qwen3-coder-plus-2025-09-23", + "name": "Qwen3 Coder Plus 2025 09 23", + "display_name": "Qwen3 Coder Plus 2025 09 23", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", - "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "display_name": "Gemini 2.5 Flash Preview 05-20", + "id": "qwen3-coder-plus-2025-07-22", + "name": "Qwen3 Coder Plus 2025 07 22", + "display_name": "Qwen3 Coder Plus 2025 07 22", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "qwen-vl-ocr-latest", + "name": "Qwen Vl Ocr Latest", + "display_name": "Qwen Vl Ocr Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2048, - "output": 3072 + "context": 34096, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", - "cost": { - "input": 0.15, - "output": 0 - }, - "type": "embedding" + "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "qvq-max-2025-05-15", + "name": "Qvq Max 2025 05 15", + "display_name": "Qvq Max 2025 05 15", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default": false, + "budget": { + "default": 16384, + "min": 0, + "max": 16384 } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "attachment": false, + "type": "chat" + }, + { + "id": "qwen-long", + "name": "Qwen Long", + "display_name": "Qwen Long", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "display_name": "Gemini 2.5 Pro Preview 06-05", + "id": "qwen-turbo-latest", + "name": "Qwen Turbo Latest", + "display_name": "Qwen Turbo Latest", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "qwen-turbo-2024-09-19", + "name": "Qwen Turbo 2024 09 19", + "display_name": "Qwen Turbo 2024 09 19", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", - "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "display_name": "Gemini 2.5 Flash Preview 04-17", + "id": "qwen-flash-2025-07-28", + "name": "Qwen Flash 2025 07 28", + "display_name": "Qwen Flash 2025 07 28", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", - "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "qwen-plus-2024-09-19", + "name": "Qwen Plus 2024 09 19", + "display_name": "Qwen Plus 2024 09 19", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 8192 }, "temperature": true, @@ -138787,29 +147445,13 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.075, - "output": 0.3 - }, + "attachment": false, "type": "chat" - } - ] - }, - "groq": { - "id": "groq", - "name": "Groq", - "display_name": "Groq", - "doc": "https://console.groq.com/docs/models", - "models": [ + }, { - "id": "gemma2-9b-it", - "name": "Gemma 2 9B", - "display_name": "Gemma 2 9B", + "id": "qwen-plus-2025-07-14", + "name": "Qwen Plus 2025 07 14", + "display_name": "Qwen Plus 2025 07 14", "modalities": { "input": [ "text" @@ -138819,29 +147461,44 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-06-27", - "last_updated": "2024-06-27", - "cost": { - "input": 0.2, - "output": 0.2 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "mistral-saba-24b", - "name": "Mistral Saba 24B", - "display_name": "Mistral Saba 24B", + "id": "qwen-plus-2025-09-11", + "name": "Qwen Plus 2025 09 11", + "display_name": "Qwen Plus 2025 09 11", "modalities": { "input": [ "text" @@ -138851,29 +147508,44 @@ ] }, "limit": { - "context": 32768, + "context": 1000000, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-02-06", - "last_updated": "2025-02-06", - "cost": { - "input": 0.79, - "output": 0.79 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ "text" @@ -138889,29 +147561,21 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.75, - "output": 0.99 - }, "type": "chat" }, { - "id": "llama-guard-3-8b", - "name": "Llama Guard 3 8B", - "display_name": "Llama Guard 3 8B", + "id": "qwen-max-2024-09-19", + "name": "Qwen Max 2024 09 19", + "display_name": "Qwen Max 2024 09 19", "modalities": { "input": [ "text" @@ -138921,28 +147585,27 @@ ] }, "limit": { - "context": 8192, + "context": 32768, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.2, - "output": 0.2 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "llama-3.3-70b-versatile", - "name": "Llama 3.3 70B Versatile", - "display_name": "Llama 3.3 70B Versatile", + "id": "qwen-max-2024-04-28", + "name": "Qwen Max 2024 04 28", + "display_name": "Qwen Max 2024 04 28", "modalities": { "input": [ "text" @@ -138952,8 +147615,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, @@ -138961,20 +147624,12 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0.59, - "output": 0.79 - }, "type": "chat" }, { - "id": "allam-2-7b", - "name": "ALLaM-2-7b", - "display_name": "ALLaM-2-7b", + "id": "qwen-max-2024-04-03", + "name": "Qwen Max 2024 04 03", + "display_name": "Qwen Max 2024 04 03", "modalities": { "input": [ "text" @@ -138984,61 +147639,51 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 8000, + "output": 2000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09", - "last_updated": "2024-09", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "whisper-large-v3", - "name": "Whisper Large V3", - "display_name": "Whisper Large V3", + "id": "qwen-max-2025-01-25", + "name": "Qwen Max 2025 01 25", + "display_name": "Qwen Max 2025 01 25", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 448, - "output": 448 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "llama-3.1-8b-instant", - "name": "Llama 3.1 8B Instant", - "display_name": "Llama 3.1 8B Instant", + "id": "qwen3-max-2025-09-23", + "name": "Qwen3 Max 20250923", + "display_name": "Qwen3 Max 20250923", "modalities": { "input": [ "text" @@ -139048,29 +147693,27 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.05, - "output": 0.08 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "llama3-70b-8192", - "name": "Llama 3 70B", - "display_name": "Llama 3 70B", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -139080,29 +147723,38 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0.59, - "output": 0.79 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "qwen-qwq-32b", - "name": "Qwen QwQ 32B", - "display_name": "Qwen QwQ 32B", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -139113,61 +147765,61 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-11-27", - "last_updated": "2024-11-27", - "cost": { - "input": 0.29, - "output": 0.39 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "whisper-large-v3-turbo", - "name": "Whisper Large v3 Turbo", - "display_name": "Whisper Large v3 Turbo", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 448, - "output": 448 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "llama3-8b-8192", - "name": "Llama 3 8B", - "display_name": "Llama 3 8B", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -139177,8 +147829,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -139186,88 +147838,97 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0.05, - "output": 0.08 - }, "type": "chat" }, { - "id": "canopylabs/orpheus-arabic-saudi", - "name": "Orpheus Arabic Saudi", - "display_name": "Orpheus Arabic Saudi", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 4000, - "output": 50000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-12-16", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "cost": { - "input": 40, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "canopylabs/orpheus-v1-english", - "name": "Orpheus V1 English", - "display_name": "Orpheus V1 English", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 4000, - "output": 50000 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-12-19", - "release_date": "2025-12-19", - "last_updated": "2025-12-19", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B", - "display_name": "Llama 4 Scout 17B", + "id": "qwen3-4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -139280,23 +147941,32 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.11, - "output": 0.34 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "meta-llama/llama-prompt-guard-2-22m", - "name": "Llama Prompt Guard 2 22M", - "display_name": "Llama Prompt Guard 2 22M", + "id": "qwen3-1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 1.7B", "modalities": { "input": [ "text" @@ -139306,61 +147976,79 @@ ] }, "limit": { - "context": 512, - "output": 512 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", - "cost": { - "input": 0.03, - "output": 0.03 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "meta-llama/llama-guard-4-12b", - "name": "Llama Guard 4 12B", - "display_name": "Llama Guard 4 12B", + "id": "qwen3-0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 1024 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.2, - "output": 0.2 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick-17b-128e-instruct", - "name": "Llama 4 Maverick 17B", - "display_name": "Llama 4 Maverick 17B", + "id": "qwen3-vl-plus-2025-09-23", + "name": "Qwen3 VL Plus 2025 09 23", + "display_name": "Qwen3 VL Plus 2025 09 23", "modalities": { "input": [ "text", @@ -139371,29 +148059,38 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.2, - "output": 0.6 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "meta-llama/llama-prompt-guard-2-86m", - "name": "Llama Prompt Guard 2 86M", - "display_name": "Llama Prompt Guard 2 86M", + "id": "qwq-plus-latest", + "name": "QwQ Plus Latest", + "display_name": "QwQ Plus Latest", "modalities": { "input": [ "text" @@ -139403,40 +148100,63 @@ ] }, "limit": { - "context": 512, - "output": 512 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { + "supported": true, + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", - "cost": { - "input": 0.04, - "output": 0.04 - }, "type": "chat" - }, + } + ] + }, + "302ai": { + "id": "302ai", + "name": "302.AI", + "display_name": "302.AI", + "api": "https://api.302.ai/v1", + "doc": "https://doc.302.ai", + "models": [ { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "claude-opus-4-1-20250805", + "name": "claude-opus-4-1-20250805", + "display_name": "claude-opus-4-1-20250805", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -139444,69 +148164,67 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", "release_date": "2025-08-05", "last_updated": "2025-08-05", "cost": { - "input": 0.075, - "output": 0.3 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "Safety GPT OSS 20B", - "display_name": "Safety GPT OSS 20B", + "id": "mistral-large-2512", + "name": "mistral-large-2512", + "display_name": "mistral-large-2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "attachment": true, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.037 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "claude-haiku-4-5", + "name": "claude-haiku-4-5", + "display_name": "claude-haiku-4-5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -139519,20 +148237,21 @@ "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "qwen/qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -139542,74 +148261,66 @@ ] }, "limit": { - "context": 131072, - "output": 40960 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-11-08", - "release_date": "2024-12-23", - "last_updated": "2024-12-23", + "open_weights": false, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 0.29, - "output": 0.59 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "groq/compound", - "name": "Compound", - "display_name": "Compound", + "id": "chatgpt-4o-latest", + "name": "chatgpt-4o-latest", + "display_name": "chatgpt-4o-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09-04", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", + "knowledge": "2023-09", + "release_date": "2024-08-08", + "last_updated": "2024-08-08", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "groq/compound-mini", - "name": "Compound Mini", - "display_name": "Compound Mini", + "id": "glm-5.1", + "name": "glm-5.1", + "display_name": "glm-5.1", "modalities": { "input": [ "text" @@ -139619,8 +148330,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -139628,31 +148339,43 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "knowledge": "2025-09-04", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", + "release_date": "2026-04-10", + "last_updated": "2026-04-10", "cost": { - "input": 0, - "output": 0 + "input": 0.86, + "output": 3.5 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "gpt-4o", + "name": "gpt-4o", + "display_name": "gpt-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, @@ -139660,93 +148383,68 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 1, - "output": 3 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct-0905", - "name": "Kimi K2 Instruct 0905", - "display_name": "Kimi K2 Instruct 0905", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" - } - ] - }, - "azure": { - "id": "azure", - "name": "Azure", - "display_name": "Azure", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ - { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.72, + "output": 3.2 }, "type": "chat" }, { - "id": "gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "gemini-3-pro-image-preview", + "name": "gemini-3-pro-image-preview", + "display_name": "gemini-3-pro-image-preview", "modalities": { "input": [ "text", @@ -139757,34 +148455,52 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 64000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2, + "output": 120 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "claude-3-5-haiku-latest", + "name": "claude-3-5-haiku-latest", + "display_name": "claude-3-5-haiku-latest", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -139792,65 +148508,84 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "deepseek-chat", + "name": "Deepseek-Chat", + "display_name": "Deepseek-Chat", "modalities": { "input": [ "text" @@ -139861,28 +148596,28 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "gpt-5-thinking", + "name": "gpt-5-thinking", + "display_name": "gpt-5-thinking", "modalities": { "input": [ "text", @@ -139893,29 +148628,30 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.2, - "output": 0.78 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "gemini-2.5-flash-preview-09-2025", + "display_name": "gemini-2.5-flash-preview-09-2025", "modalities": { "input": [ "text", @@ -139926,8 +148662,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -139937,162 +148673,162 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "claude-haiku-4-5-20251001", + "name": "claude-haiku-4-5-20251001", + "display_name": "claude-haiku-4-5-20251001", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 0.17, - "output": 0.68 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "doubao-seed-code-preview-251028", + "name": "doubao-seed-code-preview-251028", + "display_name": "doubao-seed-code-preview-251028", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-11", + "last_updated": "2025-11-11", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.17, + "output": 1.14 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gpt-5.4-nano", + "name": "gpt-5.4-nano", + "display_name": "gpt-5.4-nano", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" - }, - { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.2, + "output": 1.25 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ "text", @@ -140103,8 +148839,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -140115,29 +148851,37 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.6, - "output": 3 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "kimi-k2-0905-preview", + "name": "kimi-k2-0905-preview", + "display_name": "kimi-k2-0905-preview", "modalities": { "input": [ "text" @@ -140147,8 +148891,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -140156,154 +148900,180 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.632, + "output": 2.53 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "grok-4-1-fast-reasoning", + "name": "grok-4-1-fast-reasoning", + "display_name": "grok-4-1-fast-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 1.14, - "output": 4.56 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "grok-4.20-multi-agent-beta-0309", + "name": "grok-4.20-multi-agent-beta-0309", + "display_name": "grok-4.20-multi-agent-beta-0309", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 30000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.16, - "output": 0.64 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "gpt-5.3-chat", - "name": "GPT-5.3 Chat", - "display_name": "GPT-5.3 Chat", + "id": "claude-sonnet-4-5-20250929-thinking", + "name": "claude-sonnet-4-5-20250929-thinking", + "display_name": "claude-sonnet-4-5-20250929-thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2025-03", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", "modalities": { "input": [ "text" @@ -140314,139 +149084,138 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "grok-4-1-fast-non-reasoning", + "name": "grok-4-1-fast-non-reasoning", + "display_name": "grok-4-1-fast-non-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 2000000, + "output": 30000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.13, - "output": 0 + "input": 0.2, + "output": 0.5 }, - "type": "embedding" + "type": "chat" }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "doubao-seed-1-6-vision-250815", + "name": "doubao-seed-1-6-vision-250815", + "display_name": "doubao-seed-1-6-vision-250815", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.114, + "output": 1.143 }, "type": "chat" }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "claude-sonnet-4-5", + "name": "claude-sonnet-4-5", + "display_name": "claude-sonnet-4-5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.125, - "output": 0.5 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "grok-4.20-beta-0309-reasoning", + "name": "grok-4.20-beta-0309-reasoning", + "display_name": "grok-4.20-beta-0309-reasoning", "modalities": { "input": [ "text", @@ -140457,10 +149226,10 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -140468,41 +149237,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "claude-opus-4-1-20250805-thinking", + "name": "claude-opus-4-1-20250805-thinking", + "display_name": "claude-opus-4-1-20250805-thinking", "modalities": { "input": [ "text", @@ -140513,10 +149264,10 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -140525,40 +149276,24 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-03", + "release_date": "2025-05-27", + "last_updated": "2025-05-27", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "qwen-max-latest", + "name": "Qwen-Max-Latest", + "display_name": "Qwen-Max-Latest", "modalities": { "input": [ "text" @@ -140568,29 +149303,29 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.343, + "output": 1.372 }, "type": "chat" }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "glm-4.7-flashx", + "name": "glm-4.7-flashx", + "display_name": "glm-4.7-flashx", "modalities": { "input": [ "text" @@ -140600,43 +149335,45 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2025-04", + "release_date": "2026-01-20", + "last_updated": "2026-01-20", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.0715, + "output": 0.429 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "claude-opus-4-6-thinking", + "name": "claude-opus-4-6-thinking", + "display_name": "claude-opus-4-6-thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -140646,39 +149383,43 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, "effort": "medium", "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2025-05", + "release_date": "2026-02-06", + "last_updated": "2026-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "glm-4.5-airx", + "name": "glm-4.5-airx", + "display_name": "glm-4.5-airx", "modalities": { "input": [ "text" @@ -140687,61 +149428,30 @@ "text" ] }, - "limit": { - "context": 8192, - "output": 1536 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", - "cost": { - "input": 0.1, - "output": 0 - }, - "type": "embedding" - }, - { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 2.04, - "output": 2.04 + "input": 0.572, + "output": 1.714 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "glm-4.5-air", + "name": "glm-4.5-air", + "display_name": "glm-4.5-air", "modalities": { "input": [ "text" @@ -140751,41 +149461,30 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.1143, + "output": 0.286 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "gpt-5.1-chat-latest", + "name": "gpt-5.1-chat-latest", + "display_name": "gpt-5.1-chat-latest", "modalities": { "input": [ "text", @@ -140797,242 +149496,202 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" - }, - { - "id": "deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "display_name": "DeepSeek-V3.2-Speciale", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.58, - "output": 1.68 + "input": 1.25, + "output": 10 }, "type": "chat" }, - { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + { + "id": "qwen3-235b-a22b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.125 + "input": 0.29, + "output": 2.86 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 2, - "output": 6 + "input": 0.29, + "output": 0.86 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "qwen-flash", + "name": "Qwen-Flash", + "display_name": "Qwen-Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.022, + "output": 0.22 }, "type": "chat" }, { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "gemini-3.1-flash-image-preview", + "name": "gemini-3.1-flash-image-preview", + "display_name": "gemini-3.1-flash-image-preview", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-27", + "last_updated": "2026-02-27", "cost": { - "input": 2.5, - "output": 10 + "input": 0.5, + "output": 60 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -141040,20 +149699,20 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.37, - "output": 0.37 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", "modalities": { "input": [ "text" @@ -141063,67 +149722,68 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 5.33, - "output": 16 + "input": 0.286, + "output": 1.142 }, "type": "chat" }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.286, + "output": 1.142 }, "type": "chat" }, { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "ministral-14b-2512", + "name": "ministral-14b-2512", + "display_name": "ministral-14b-2512", "modalities": { "input": [ "text", @@ -141135,7 +149795,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -141144,19 +149804,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 10, - "output": 30 + "input": 0.33, + "output": 0.33 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "gpt-5.4-nano-2026-03-17", + "name": "gpt-5.4-nano-2026-03-17", + "display_name": "gpt-5.4-nano-2026-03-17", "modalities": { "input": [ "text", @@ -141174,15 +149834,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high", @@ -141197,54 +149858,82 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.2, + "output": 1.25 }, "type": "chat" }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "claude-sonnet-4-6", + "name": "claude-sonnet-4-6", + "display_name": "claude-sonnet-4-6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 1536 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-18", + "last_updated": "2026-03-13", "cost": { - "input": 0.12, - "output": 0 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "gpt-5-pro", + "name": "gpt-5-pro", + "display_name": "gpt-5-pro", "modalities": { "input": [ "text", @@ -141256,26 +149945,20 @@ }, "limit": { "context": 400000, - "output": 128000 + "output": 272000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], + "default_enabled": true, + "mode": "fixed", + "effort": "high", "verbosity": "medium", "verbosity_options": [ "low", @@ -141285,22 +149968,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "deepseek-reasoner", + "name": "Deepseek-Reasoner", + "display_name": "Deepseek-Reasoner", "modalities": { "input": [ "text" @@ -141310,77 +149992,75 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 16.5, - "output": 66, - "cache_read": 8.25 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "deepseek-v3.2-thinking", + "name": "DeepSeek-V3.2-Thinking", + "display_name": "DeepSeek-V3.2-Thinking", "modalities": { "input": [ "text" @@ -141390,82 +150070,76 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.1, - "output": 0 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "grok-4-20-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "doubao-seed-1-8-251215", + "name": "doubao-seed-1-8-251215", + "display_name": "doubao-seed-1-8-251215", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 8192 + "context": 224000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 2, - "output": 6 + "input": 0.114, + "output": 0.286 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "gemini-2.5-flash-lite-preview-09-2025", + "display_name": "gemini-2.5-flash-lite-preview-09-2025", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -141475,39 +150149,36 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "display_name": "gemini-3-pro-preview", "modalities": { "input": [ "text", @@ -141518,8 +150189,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -141529,25 +150200,36 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-06", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "gpt-5.1", + "name": "gpt-5.1", + "display_name": "gpt-5.1", "modalities": { "input": [ "text", @@ -141558,22 +150240,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -141581,181 +150270,160 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "qwen3-max-2025-09-23", + "name": "qwen3-max-2025-09-23", + "display_name": "qwen3-max-2025-09-23", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 258048, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.86, + "output": 3.43 }, "type": "chat" }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "gpt-5.4", + "name": "gpt-5.4", + "display_name": "gpt-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1050000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.14, - "output": 0 - }, - "type": "chat" - }, - { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", - "modalities": { - "input": [ - "text" + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "cache_write": 0, + "tiers": [ + { + "input": 5, + "output": 22.5, + "tier": { + "type": "context", + "size": 272000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16384, - "output": 16384 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", - "cost": { - "input": 1, - "output": 2 + "context_over_200k": { + "input": 5, + "output": 22.5 + } }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8191, - "output": 1536 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "cost": { - "input": 0.02, - "output": 0 - }, - "type": "embedding" - }, - { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "claude-3-5-haiku-20241022", + "name": "claude-3-5-haiku-20241022", + "display_name": "claude-3-5-haiku-20241022", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "claude-opus-4-5-20251101", + "name": "claude-opus-4-5-20251101", + "display_name": "claude-opus-4-5-20251101", "modalities": { "input": [ "text", @@ -141776,28 +150444,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "output": 25 }, "type": "chat" }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ "text" @@ -141807,72 +150468,87 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.575, + "output": 2.3 }, "type": "chat" }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "gemini-2.0-flash-lite", + "name": "gemini-2.0-flash-lite", + "display_name": "gemini-2.0-flash-lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 2000000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "claude-opus-4-20250514", + "name": "claude-opus-4-20250514", + "display_name": "claude-opus-4-20250514", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -141880,89 +150556,80 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.075, - "output": 0.3 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "gpt-5.4-mini", + "name": "gpt-5.4-mini", + "display_name": "gpt-5.4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", - "cost": { - "input": 60, - "output": 120 - }, - "type": "chat" - }, - { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 2048 + "supported": true, + "default": false }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "kimi-k2-thinking-turbo", + "name": "kimi-k2-thinking-turbo", + "display_name": "kimi-k2-thinking-turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -141978,115 +150645,89 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.95, - "output": 4 + "input": 1.265, + "output": 9.119 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "claude-sonnet-4-5-20250929", + "name": "claude-sonnet-4-5-20250929", + "display_name": "claude-sonnet-4-5-20250929", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-07-31", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "grok-4.1", + "name": "grok-4.1", + "display_name": "grok-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.075, - "output": 0.3 + "input": 2, + "output": 10 }, "type": "chat" }, { - "id": "grok-4-20-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "qwen3-30b-a3b", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "modalities": { "input": [ "text" @@ -142096,67 +150737,80 @@ ] }, "limit": { - "context": 262000, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 2, - "output": 6 + "input": 0.11, + "output": 1.08 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 0301", + "id": "claude-opus-4-5-20251101-thinking", + "name": "claude-opus-4-5-20251101-thinking", + "display_name": "claude-opus-4-5-20251101-thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "knowledge": "2025-03", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 2 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "claude-opus-4-7", + "name": "claude-opus-4-7", + "display_name": "claude-opus-4-7", "modalities": { "input": [ "text", @@ -142168,7 +150822,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 128000 }, "temperature": true, @@ -142181,38 +150835,48 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", + "mode": "effort", + "effort": "high", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh" ], "interleaved": true, "summaries": true, - "visibility": "summary", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2026-01-31", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { "input": 5, "output": 25, "cache_read": 0.5, "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], "context_over_200k": { "input": 10, "output": 37.5, @@ -142223,41 +150887,9 @@ "type": "chat" }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", - "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "glm-5-turbo", + "name": "glm-5-turbo", + "display_name": "glm-5-turbo", "modalities": { "input": [ "text" @@ -142267,8 +150899,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -142278,56 +150910,66 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0.72, + "output": 3.2 }, "type": "chat" }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "grok-4.20-beta-0309-non-reasoning", + "name": "grok-4.20-beta-0309-non-reasoning", + "display_name": "grok-4.20-beta-0309-non-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 30000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.17, - "output": 0.68 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "qwen3-235b-a22b-instruct-2507", + "display_name": "qwen3-235b-a22b-instruct-2507", "modalities": { "input": [ "text" @@ -142337,42 +150979,41 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 3, - "output": 4 + "input": 0.29, + "output": 1.143 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "display_name": "gemini-3-flash-preview", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -142382,58 +151023,38 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - }, - { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-06", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gpt-5.4-pro", + "name": "gpt-5.4-pro", + "display_name": "gpt-5.4-pro", "modalities": { "input": [ "text", @@ -142444,7 +151065,7 @@ ] }, "limit": { - "context": 272000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -142458,12 +151079,11 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ - "minimal", - "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -142476,116 +151096,35 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" - }, - { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", - "cost": { - "input": 60, - "output": 120 - }, - "type": "chat" - }, - { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 512, - "output": 1024 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.1, - "output": 0 - }, - "type": "chat" - }, - { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", - "modalities": { - "input": [ - "text" + "input": 30, + "output": 180, + "cache_read": 0, + "cache_write": 0, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.125, - "output": 0.5 + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "gpt-5.2-chat-latest", + "name": "gpt-5.2-chat-latest", + "display_name": "gpt-5.2-chat-latest", "modalities": { "input": [ "text", @@ -142597,28 +151136,29 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2025-08-31", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.4, - "output": 2 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -142628,29 +151168,39 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.5, - "output": 2 + "input": 0.6, + "output": 4.8 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "qwen3-coder-480b-a35b-instruct", + "display_name": "qwen3-coder-480b-a35b-instruct", "modalities": { "input": [ "text" @@ -142660,96 +151210,69 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.86, + "output": 3.43 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-4.1-nano", + "name": "gpt-4.1-nano", + "display_name": "gpt-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "gpt-5.4-mini-2026-03-17", + "name": "gpt-5.4-mini-2026-03-17", + "display_name": "gpt-5.4-mini-2026-03-17", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { @@ -142772,7 +151295,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -142783,22 +151307,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "MiniMax-M1", + "name": "MiniMax-M1", + "display_name": "MiniMax-M1", "modalities": { "input": [ "text" @@ -142808,8 +151331,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -142818,19 +151341,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.132, + "output": 1.254 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ "text", @@ -142841,62 +151363,83 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.25, - "output": 1 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "gemini-2.5-flash-image", + "name": "gemini-2.5-flash-image", + "display_name": "gemini-2.5-flash-image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-01", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.3, + "output": 30 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ "text", @@ -142914,16 +151457,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", + "minimal", "low", "medium", "high" @@ -142939,20 +151482,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-05-30", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "claude-opus-4-6", + "name": "claude-opus-4-6", + "display_name": "claude-opus-4-6", "modalities": { "input": [ "text", @@ -142965,7 +151507,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -143001,244 +151543,169 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", + "knowledge": "2025-05-31", + "release_date": "2026-02-06", "last_updated": "2026-03-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "doubao-seed-1-6-thinking-250715", + "name": "doubao-seed-1-6-thinking-250715", + "display_name": "doubao-seed-1-6-thinking-250715", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 256000, + "output": 16000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.121, + "output": 1.21 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 10, - "output": 30 + "input": 0.286, + "output": 1.142 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "glm-for-coding", + "name": "glm-for-coding", + "display_name": "glm-for-coding", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.086, + "output": 0.343 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", - "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 - }, - "type": "chat" - }, - { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "release_date": "2025-10-26", + "last_updated": "2025-10-26", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "claude-sonnet-4-20250514", + "name": "claude-sonnet-4-20250514", + "display_name": "claude-sonnet-4-20250514", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -143246,102 +151713,83 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "gemini-2.5-flash-nothink", + "name": "gemini-2.5-flash-nothink", + "display_name": "gemini-2.5-flash-nothink", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-01", + "release_date": "2025-06-24", + "last_updated": "2025-06-24", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "glm-4.5-x", + "name": "glm-4.5-x", + "display_name": "glm-4.5-x", "modalities": { "input": [ "text" @@ -143351,36 +151799,29 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 1.143, + "output": 2.29 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "grok-4-fast-non-reasoning", + "name": "grok-4-fast-non-reasoning", + "display_name": "grok-4-fast-non-reasoning", "modalities": { "input": [ "text", @@ -143391,54 +151832,29 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 30, - "output": 180, - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "qwen-plus", + "name": "Qwen-Plus", + "display_name": "Qwen-Plus", "modalities": { "input": [ "text" @@ -143448,45 +151864,40 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2024-10", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.12, + "output": 1.2 }, "type": "chat" }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "glm-5", + "name": "glm-5", + "display_name": "glm-5", "modalities": { "input": [ "text" @@ -143496,8 +151907,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -143507,134 +151918,121 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 + "input": 0.6, + "output": 2.6 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "grok-4-fast-reasoning", + "name": "grok-4-fast-reasoning", + "display_name": "grok-4-fast-reasoning", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 2000000, + "output": 30000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "claude-opus-4-5", + "name": "claude-opus-4-5", + "display_name": "claude-opus-4-5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-03-31", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -143642,37 +152040,36 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0.145, + "output": 0.43 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "claude-sonnet-4-6-thinking", + "name": "claude-sonnet-4-6-thinking", + "display_name": "claude-sonnet-4-6-thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -143682,32 +152079,43 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, "effort": "medium", "effort_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-08", + "release_date": "2026-02-18", + "last_updated": "2026-03-13", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", @@ -143719,7 +152127,7 @@ }, "limit": { "context": 400000, - "output": 272000 + "output": 128000 }, "temperature": false, "tool_call": true, @@ -143731,8 +152139,14 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "fixed", - "effort": "high", + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -143745,52 +152159,71 @@ "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 15, - "output": 120 + "input": 1.25, + "output": 10 }, "type": "chat" - }, + } + ] + }, + "xpersona": { + "id": "xpersona", + "name": "Xpersona", + "display_name": "Xpersona", + "api": "https://www.xpersona.co/v1", + "doc": "https://www.xpersona.co/docs", + "models": [ { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "xpersona-frieren-coder", + "name": "Xpersona Frieren Coder", + "display_name": "Xpersona Frieren Coder", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2025-12-30", + "release_date": "2026-05-01", + "last_updated": "2026-05-15", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 1.5, + "output": 6, + "reasoning": 6, + "cache_read": 0.15 }, "type": "chat" - }, + } + ] + }, + "stepfun": { + "id": "stepfun", + "name": "StepFun", + "display_name": "StepFun", + "api": "https://api.stepfun.com/v1", + "doc": "https://platform.stepfun.com/docs/zh/overview/concept", + "models": [ { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "step-1-32k", + "name": "Step 1 (32K)", + "display_name": "Step 1 (32K)", "modalities": { "input": [ "text" @@ -143800,97 +152233,99 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-01", + "last_updated": "2026-02-13", "cost": { - "input": 2.5, - "output": 10 + "input": 2.05, + "output": 9.59, + "cache_read": 0.41 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "step-2-16k", + "name": "Step 2 (16K)", + "display_name": "Step 2 (16K)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 16384, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-06", + "release_date": "2025-01-01", + "last_updated": "2026-02-13", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 5.21, + "output": 16.44, + "cache_read": 1.04 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "step-3.5-flash-2603", + "name": "Step 3.5 Flash 2603", + "display_name": "Step 3.5 Flash 2603", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -143900,30 +152335,39 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" - }, + } + ] + }, + "xai": { + "id": "xai", + "name": "xai", + "display_name": "xai", + "doc": "https://docs.x.ai/docs/models", + "models": [ { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "grok-4.20-0309-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ "text", @@ -143944,40 +152388,47 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 2, + "output": 6, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + } }, "type": "chat" - } - ] - }, - "fastrouter": { - "id": "fastrouter", - "name": "FastRouter", - "display_name": "FastRouter", - "api": "https://go.fastrouter.ai/api/v1", - "doc": "https://fastrouter.ai/models", - "models": [ + }, { - "id": "x-ai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "grok-4.20-0309-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -143985,66 +152436,71 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 15 + "input": 2, + "output": 6, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "grok-vision-beta", + "name": "Grok Vision Beta", + "display_name": "Grok Vision Beta", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-23", - "last_updated": "2025-01-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.03, - "output": 0.14 + "input": 5, + "output": 15, + "cache_read": 5 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "grok-2-vision-1212", + "name": "Grok 2 Vision 1212", + "display_name": "Grok 2 Vision 1212", "modalities": { "input": [ "text", @@ -144055,108 +152511,97 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "search": { + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "grok-imagine-image-quality", + "name": "Grok Imagine Image Quality", + "display_name": "Grok Imagine Image Quality", "modalities": { "input": [ "text", "image" ], + "output": [ + "image" + ] + }, + "limit": { + "context": 1024, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04", + "last_updated": "2026-05-16", + "type": "chat" + }, + { + "id": "grok-2-1212", + "name": "Grok 2 1212", + "display_name": "Grok 2 1212", + "modalities": { + "input": [ + "text" + ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "search": { + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-08", + "release_date": "2024-12-12", + "last_updated": "2024-12-12", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "grok-beta", + "name": "Grok Beta", + "display_name": "Grok Beta", "modalities": { "input": [ "text" @@ -144167,89 +152612,58 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.05, - "output": 0.2 + "input": 5, + "output": 15, + "cache_read": 5 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "grok-imagine-video", + "name": "Grok Imagine Video", + "display_name": "Grok Imagine Video", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1024, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, + "release_date": "2026-03", + "last_updated": "2026-05-16", "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "grok-2", + "name": "Grok 2", + "display_name": "Grok 2", "modalities": { "input": [ "text" @@ -144260,121 +152674,103 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "grok-2-vision-latest", + "name": "Grok 2 Vision Latest", + "display_name": "Grok 2 Vision Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { - "input": 0.95, - "output": 3.15 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "qwen/qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "grok-imagine-image", + "name": "Grok Imagine Image", + "display_name": "Grok Imagine Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 1024, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 0.3, - "output": 1.2 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03", + "last_updated": "2026-05-16", "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -144384,95 +152780,74 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { "input": 1.25, - "output": 10, - "cache_read": 0.31 + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "grok-2-vision", + "name": "Grok 2 Vision", + "display_name": "Grok 2 Vision", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.0375 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "grok-2-latest", + "name": "Grok 2 Latest", + "display_name": "Grok 2 Latest", "modalities": { "input": [ "text" @@ -144483,7 +152858,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -144491,20 +152866,21 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { - "input": 0.55, - "output": 2.2 + "input": 2, + "output": 10, + "cache_read": 2 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "grok-4.20-multi-agent-0309", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ "text", @@ -144515,145 +152891,136 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 2000000, + "output": 30000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { "input": 2, - "output": 8, - "cache_read": 0.5 + "output": 6, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 12, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 12, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "grok-3-mini-fast-beta", + "name": "Grok 3 Mini Fast Beta", + "display_name": "Grok 3 Mini Fast Beta", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "effort": "low" }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "grok-3-mini-beta", + "name": "Grok 3 Mini Beta", + "display_name": "Grok 3 Mini Beta", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "effort": "low" }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "search": { + "supported": false }, + "attachment": false, "type": "chat" - } - ] - }, - "stackit": { - "id": "stackit", - "name": "STACKIT", - "display_name": "STACKIT", - "api": "https://api.openai-compat.model-serving.eu01.onstackit.cloud/v1", - "doc": "https://docs.stackit.cloud/products/data-and-ai/ai-model-serving/basics/available-shared-models", - "models": [ + }, { - "id": "Qwen/Qwen3-VL-Embedding-8B", - "name": "Qwen3-VL Embedding 8B", - "display_name": "Qwen3-VL Embedding 8B", + "id": "grok-3-fast-beta", + "name": "Grok 3 Fast Beta", + "display_name": "Grok 3 Fast Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 120000, + "output": 100000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", - "cost": { - "input": 0.09, - "output": 0.09 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", - "name": "Qwen3-VL 235B", - "display_name": "Qwen3-VL 235B", + "id": "grok-2-image-1212", + "name": "Grok 2 Image 1212", + "display_name": "Grok 2 Image 1212", "modalities": { "input": [ "text", @@ -144664,28 +153031,24 @@ ] }, "limit": { - "context": 218000, - "output": 8192 + "context": 130000, + "output": 100000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 1.64, - "output": 1.91 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "grok-3-beta", + "name": "Grok 3 Beta", + "display_name": "Grok 3 Beta", "modalities": { "input": [ "text" @@ -144695,28 +153058,33 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.16, - "output": 0.27 + "search": { + "supported": false }, + "attachment": false, "type": "chat" - }, + } + ] + }, + "sarvam": { + "id": "sarvam", + "name": "Sarvam AI", + "display_name": "Sarvam AI", + "api": "https://api.sarvam.ai/v1", + "doc": "https://docs.sarvam.ai/api-reference-docs/getting-started/models", + "models": [ { - "id": "neuralmagic/Mistral-Nemo-Instruct-2407-FP8", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "sarvam-30b", + "name": "Sarvam-30B", + "display_name": "Sarvam-30B", "modalities": { "input": [ "text" @@ -144726,28 +153094,36 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", - "cost": { - "input": 0.49, - "output": 0.71 - }, + "release_date": "2026-02-18", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "sarvam-105b", + "name": "Sarvam-105B", + "display_name": "Sarvam-105B", "modalities": { "input": [ "text" @@ -144757,8 +153133,8 @@ ] }, "limit": { - "context": 131000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -144768,23 +153144,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.49, - "output": 0.71 - }, + "release_date": "2026-02-18", + "last_updated": "2026-03-06", "type": "chat" - }, + } + ] + }, + "zhipuai": { + "id": "zhipuai", + "name": "Zhipu AI", + "display_name": "Zhipu AI", + "api": "https://open.bigmodel.cn/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "models": [ { - "id": "cortecs/Llama-3.3-70B-Instruct-FP8-Dynamic", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -144794,60 +153181,90 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.49, - "output": 0.71 + "input": 6, + "output": 24, + "cache_read": 1.3, + "cache_write": 0 }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 37000, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-05-17", - "last_updated": "2025-05-17", + "open_weights": false, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.49, - "output": 0.71 + "input": 5, + "output": 22, + "cache_read": 1.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "intfloat/e5-mistral-7b-instruct", - "name": "E5 Mistral 7B", - "display_name": "E5 Mistral 7B", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -144857,37 +153274,42 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.02, - "output": 0.02 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "tencent-coding-plan": { - "id": "tencent-coding-plan", - "name": "Tencent Coding Plan (China)", - "display_name": "Tencent Coding Plan (China)", - "api": "https://api.lkeap.cloud.tencent.com/coding/v3", - "doc": "https://cloud.tencent.com/document/product/1772/128947", - "models": [ + }, { - "id": "kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", @@ -144899,7 +153321,7 @@ ] }, "limit": { - "context": 262144, + "context": 128000, "output": 32768 }, "temperature": true, @@ -144908,34 +153330,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -144945,8 +153354,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -144966,21 +153375,22 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, "cache_write": 0 }, "type": "chat" }, { - "id": "hunyuan-turbos", - "name": "Hunyuan-TurboS", - "display_name": "Hunyuan-TurboS", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -144991,17 +153401,19 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0, "output": 0, @@ -145011,9 +153423,9 @@ "type": "chat" }, { - "id": "hunyuan-t1", - "name": "Hunyuan-T1", - "display_name": "Hunyuan-T1", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -145024,7 +153436,7 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 98304 }, "temperature": true, "tool_call": true, @@ -145032,33 +153444,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, "cache_write": 0 }, "type": "chat" }, { - "id": "hunyuan-2.0-instruct", - "name": "Tencent HY 2.0 Instruct", - "display_name": "Tencent HY 2.0 Instruct", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -145068,30 +153470,37 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, "cache_write": 0 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -145101,8 +153510,8 @@ ] }, "limit": { - "context": 204800, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -145112,19 +153521,14 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { "input": 0, "output": 0, @@ -145134,9 +153538,44 @@ "type": "chat" }, { - "id": "tc-code-latest", - "name": "Auto", - "display_name": "Auto", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 64000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "cost": { + "input": 0.6, + "output": 1.8 + }, + "type": "chat" + }, + { + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -145147,29 +153586,31 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, "cache_write": 0 }, "type": "chat" }, { - "id": "hunyuan-2.0-thinking", - "name": "Tencent HY 2.0 Think", - "display_name": "Tencent HY 2.0 Think", + "id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ "text" @@ -145179,8 +153620,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -145188,46 +153629,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, "cache_write": 0 }, "type": "chat" } ] }, - "privatemode-ai": { - "id": "privatemode-ai", - "name": "Privatemode AI", - "display_name": "Privatemode AI", - "api": "http://localhost:8080/v1", - "doc": "https://docs.privatemode.ai/api/overview", + "bailing": { + "id": "bailing", + "name": "Bailing", + "display_name": "Bailing", + "api": "https://api.tbox.cn/api/llm/v1/chat/completions", + "doc": "https://alipaytbox.yuque.com/sxs0ba/ling/intro", "models": [ { - "id": "gemma-3-27b", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "Ring-1T", + "name": "Ring-1T", + "display_name": "Ring-1T", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -145235,103 +153665,180 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "knowledge": "2024-06", + "release_date": "2025-10", + "last_updated": "2025-10", "cost": { - "input": 0, - "output": 0 + "input": 0.57, + "output": 2.29 }, "type": "chat" }, { - "id": "whisper-large-v3", - "name": "Whisper large-v3", - "display_name": "Whisper large-v3", + "id": "Ling-1T", + "name": "Ling-1T", + "display_name": "Ling-1T", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2023-09-01", + "knowledge": "2024-06", + "release_date": "2025-10", + "last_updated": "2025-10", "cost": { - "input": 0, - "output": 0 + "input": 0.57, + "output": 2.29 }, "type": "chat" - }, + } + ] + }, + "qihang-ai": { + "id": "qihang-ai", + "name": "QiHang", + "display_name": "QiHang", + "api": "https://api.qhaigc.net/v1", + "doc": "https://www.qhaigc.net/docs", + "models": [ { - "id": "qwen3-embedding-4b", - "name": "Qwen3-Embedding 4B", - "display_name": "Qwen3-Embedding 4B", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 2560 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-06-06", - "last_updated": "2025-06-06", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", + "cost": { + "input": 0.14, + "output": 0.71 + }, + "type": "chat" + }, + { + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1000000, + "output": 65000 }, "temperature": true, "tool_call": true, @@ -145341,108 +153848,236 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-04", - "last_updated": "2025-08-14", + "attachment": true, + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0, - "output": 0 + "input": 0.57, + "output": 3.43 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b", - "name": "Qwen3-Coder 30B-A3B", - "display_name": "Qwen3-Coder 30B-A3B", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", + "cost": { + "input": 0.71, + "output": 3.57 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 0.43, + "output": 2.14 + }, + "type": "chat" + }, + { + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0, - "output": 0 + "input": 0.07, + "output": 0.43, + "tiers": [ + { + "input": 0.07, + "output": 0.43, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 0.07, + "output": 0.43 + } }, "type": "chat" - } - ] - }, - "google": { - "id": "google", - "name": "google", - "display_name": "google", - "doc": "https://ai.google.dev/gemini-api/docs/models", - "models": [ + }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.14, + "output": 1.14 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "display_name": "Gemini 2.5 Pro Preview 05-06", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", - "audio", "video", + "audio", "pdf" ], "output": [ @@ -145466,9 +154101,10 @@ "mode": "budget", "budget": { "default": -1, - "min": 128, - "max": 32768, + "min": 0, + "max": 24576, "auto": -1, + "off": 0, "unit": "tokens" }, "summaries": true, @@ -145481,72 +154117,108 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.09, + "output": 0.71, + "tiers": [ + { + "input": 0.09, + "output": 0.71, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 0.09, + "output": 0.71 + } }, "type": "chat" }, { - "id": "gemini-live-2.5-flash-preview-native-audio", - "name": "Gemini Live 2.5 Flash Preview Native Audio", - "display_name": "Gemini Live 2.5 Flash Preview Native Audio", + "id": "gpt-5-mini", + "name": "GPT-5-Mini", + "display_name": "GPT-5-Mini", "modalities": { "input": [ "text", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-09-18", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.5, - "output": 2, - "input_audio": 3, - "output_audio": 12 + "input": 0.04, + "output": 0.29 }, "type": "chat" - }, + } + ] + }, + "lilac": { + "id": "lilac", + "name": "Lilac", + "display_name": "Lilac", + "api": "https://api.getlilac.com/v1", + "doc": "https://docs.getlilac.com/inference/models", + "models": [ { - "id": "gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -145557,109 +154229,79 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.7, + "output": 3.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09 2025", - "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 202800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": -1, - "min": 512, - "max": 24576 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "search": { - "supported": true, - "default": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.9, + "output": 3, + "cache_read": 0.27 }, "type": "chat" }, { - "id": "gemini-1.5-flash", - "name": "Gemini 1.5 Flash", - "display_name": "Gemini 1.5 Flash", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ @@ -145667,66 +154309,95 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 262100, + "output": 262100 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.01875 + "input": 0.11, + "output": 0.35 }, "type": "chat" }, { - "id": "gemini-1.5-pro", - "name": "Gemini 1.5 Pro", - "display_name": "Gemini 1.5 Pro", + "id": "minimaxai/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 204800, + "output": 204800 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-02-15", - "last_updated": "2024-02-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.25, - "output": 5, - "cache_read": 0.3125 + "input": 0.3, + "output": 1.2, + "cache_read": 0.055 }, "type": "chat" - }, + } + ] + }, + "alibaba-cn": { + "id": "alibaba-cn", + "name": "alibaba-cn", + "display_name": "alibaba-cn", + "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", + "models": [ { - "id": "gemma-3n-e4b-it", - "name": "Gemma 3n 4B", - "display_name": "Gemma 3n 4B", + "id": "qwen2-5-math-7b-instruct", + "name": "Qwen2.5-Math 7B Instruct", + "display_name": "Qwen2.5-Math 7B Instruct", "modalities": { "input": [ "text" @@ -145736,186 +154407,152 @@ ] }, "limit": { - "context": 8192, - "output": 2000 + "context": 4096, + "output": 3072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 + "input": 0.144, + "output": 0.287 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.072, + "output": 0.144 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 2.294, + "output": 6.881 }, "type": "chat" }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "kimi-k2.5", + "name": "Moonshot Kimi K2.5", + "display_name": "Moonshot Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, - "search": { - "supported": true, - "default": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.574, + "output": 2.411 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 65536 }, "temperature": true, @@ -145927,90 +154564,73 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "input": 0.573, + "output": 3.44, + "reasoning": 3.44 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-tts", - "name": "Gemini 2.5 Flash Preview TTS", - "display_name": "Gemini 2.5 Flash Preview TTS", + "id": "qwen-math-turbo", + "name": "Qwen Math Turbo", + "display_name": "Qwen Math Turbo", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8000, - "output": 16000 + "context": 4096, + "output": 3072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "knowledge": "2024-04", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.5, - "output": 10 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 202752, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -146021,99 +154641,80 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-14", + "last_updated": "2026-04-14", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.87, + "output": 3.48, + "cache_read": 0.17 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "display_name": "Gemini 2.5 Flash Preview 05-20", + "id": "qwen3-vl-plus", + "name": "Qwen3 VL Plus", + "display_name": "Qwen3 VL Plus", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.143353, + "output": 1.433525, + "reasoning": 4.300576 }, "type": "chat" }, { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "qwen2-5-math-72b-instruct", + "name": "Qwen2.5-Math 72B Instruct", + "display_name": "Qwen2.5-Math 72B Instruct", "modalities": { "input": [ "text" @@ -146123,29 +154724,29 @@ ] }, "limit": { - "context": 2048, + "context": 4096, "output": 3072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.15, - "output": 0 + "input": 0.574, + "output": 1.721 }, - "type": "embedding" + "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "display_name": "Qwen3-VL 235B-A22B", "modalities": { "input": [ "text", @@ -146156,79 +154757,85 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 128, - "max": 32768 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "search": { + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 0.286705, + "output": 1.14682, + "reasoning": 2.867051 + }, + "type": "chat" + }, + { + "id": "deepseek-r1-distill-llama-8b", + "name": "DeepSeek R1 Distill Llama 8B", + "display_name": "DeepSeek R1 Distill Llama 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { "supported": true, - "default": false + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -146236,34 +154843,41 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "gemma-4-31b-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "qwq-32b", + "name": "QwQ 32B", + "display_name": "QwQ 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -146272,170 +154886,183 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", + "cost": { + "input": 0.287, + "output": 0.861 + }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "display_name": "Gemini 2.5 Pro Preview 06-05", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 0.23, + "output": 0.574 }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "display_name": "Gemini 2.5 Flash Image", + "id": "qwen3-8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 + "input": 0.072, + "output": 0.287, + "reasoning": 0.717 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025, - "input_audio": 0.3 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "gemma-3-12b-it", - "name": "Gemma 3 12B", - "display_name": "Gemma 3 12B", + "id": "deepseek-r1-distill-qwen-1-5b", + "name": "DeepSeek R1 Distill Qwen 1.5B", + "display_name": "DeepSeek R1 Distill Qwen 1.5B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -146443,18 +155070,18 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { "input": 0, "output": 0 @@ -146462,74 +155089,41 @@ "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "qwen2-5-coder-32b-instruct", + "name": "Qwen2.5-Coder 32B Instruct", + "display_name": "Qwen2.5-Coder 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 0, - "max": 24576 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "gemma-3n-e2b-it", - "name": "Gemma 3n 2B", - "display_name": "Gemma 3n 2B", + "id": "tongyi-intent-detect-v3", + "name": "Tongyi Intent Detect V3", + "display_name": "Tongyi Intent Detect V3", "modalities": { "input": [ "text" @@ -146540,160 +155134,164 @@ }, "limit": { "context": 8192, - "output": 2000 + "output": 1024 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0, - "output": 0 + "input": 0.058, + "output": 0.144 }, "type": "chat" }, { - "id": "gemini-3.1-flash-image-preview", - "name": "Gemini 3.1 Flash Image (Preview)", - "display_name": "Gemini 3.1 Flash Image (Preview)", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 65536, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.25, - "output": 60 + "input": 0.287, + "output": 1.147 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.861, + "output": 3.441 }, "type": "chat" }, { - "id": "gemma-3-4b-it", - "name": "Gemma 3 4B", - "display_name": "Gemma 3 4B", + "id": "qwen3-235b-a22b", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.287, + "output": 1.147, + "reasoning": 2.868 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "display_name": "Gemini 2.5 Flash Preview 04-17", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -146705,230 +155303,197 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 + "input": 0.43, + "output": 2.58, + "reasoning": 2.58 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-tts", - "name": "Gemini 2.5 Pro Preview TTS", - "display_name": "Gemini 2.5 Pro Preview TTS", + "id": "qwen-doc-turbo", + "name": "Qwen Doc Turbo", + "display_name": "Qwen Doc Turbo", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8000, - "output": 16000 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 1, - "output": 20 + "input": 0.087, + "output": 0.144 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09 2025", - "display_name": "Gemini 2.5 Flash Preview 09 2025", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, + "default": false, "budget": { - "default": -1, + "default": 81920, "min": 0, - "max": 24576 + "max": 81920 } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "search": { "supported": true, - "default": false + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "input": 0.022, + "output": 0.216 }, "type": "chat" }, { - "id": "gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "display_name": "Qwen-Omni Turbo Realtime", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0, - "output": 0 + "input": 0.23, + "output": 0.918, + "input_audio": 3.584, + "output_audio": 7.168 }, "type": "chat" }, { - "id": "gemma-4-26b-a4b-it", - "name": "Gemma 4 26B", - "display_name": "Gemma 4 26B", + "id": "qwen-mt-turbo", + "name": "Qwen Mt Turbo", + "display_name": "Qwen Mt Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 16384, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", + "cost": { + "input": 0.101, + "output": 0.28 + }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -146936,98 +155501,85 @@ "supported": true, "default": false, "budget": { - "default": -1, - "min": 512, - "max": 24576 + "default": 38912, + "min": 0, + "max": 38912 } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "search": { "supported": true, - "default": false + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-07-15", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.044, + "output": 0.087, + "reasoning": 0.431 }, "type": "chat" }, { - "id": "gemini-2.5-flash-image-preview", - "name": "Gemini 2.5 Flash Image Preview", - "display_name": "Gemini 2.5 Flash Image Preview", + "id": "moonshot-kimi-k2-instruct", + "name": "Moonshot Kimi K2 Instruct", + "display_name": "Moonshot Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 + "input": 0.574, + "output": 2.294 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-1.5-flash-8b", - "name": "Gemini 1.5 Flash-8B", - "display_name": "Gemini 1.5 Flash-8B", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 32768, "output": 8192 }, "temperature": true, @@ -147035,72 +155587,70 @@ "reasoning": { "supported": false }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-10-03", - "last_updated": "2024-10-03", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0.0375, - "output": 0.15, - "cache_read": 0.01 + "input": 0.345, + "output": 1.377 }, "type": "chat" }, { - "id": "gemini-live-2.5-flash", - "name": "Gemini Live 2.5 Flash", - "display_name": "Gemini Live 2.5 Flash", + "id": "qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "display_name": "Qwen2.5-VL 7B Instruct", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.5, - "output": 2, - "input_audio": 3, - "output_audio": 12 + "input": 0.287, + "output": 0.717 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "display_name": "Qwen2.5 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 8192 }, "temperature": true, @@ -147108,62 +155658,53 @@ "reasoning": { "supported": false }, - "search": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "gemini-2.0-flash-preview-image-generation", - "name": "Gemini 2.0 Flash Preview Image Generation", - "display_name": "Gemini 2.0 Flash Preview Image Generation", + "id": "qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "display_name": "Qwen3-ASR Flash", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 53248, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": false + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", + "cost": { + "input": 0.032, + "output": 0.032 }, - "attachment": true, "type": "chat" - } - ] - }, - "drun": { - "id": "drun", - "name": "D.Run (China)", - "display_name": "D.Run (China)", - "api": "https://chat.d.run/v1", - "doc": "https://www.d.run", - "models": [ + }, { - "id": "public/deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "qwen-math-plus", + "name": "Qwen Math Plus", + "display_name": "Qwen Math Plus", "modalities": { "input": [ "text" @@ -147173,52 +155714,42 @@ ] }, "limit": { - "context": 131072, - "output": 32000 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-08-16", + "last_updated": "2024-09-19", "cost": { - "input": 0.55, - "output": 2.2 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "public/minimax-m25", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -147239,18 +155770,39 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.29, - "output": 1.16 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, "type": "chat" }, { - "id": "public/deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -147260,8 +155812,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -147269,29 +155821,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.144, + "output": 0.574 }, "type": "chat" - } - ] - }, - "moonshot-ai": { - "id": "moonshot-ai", - "name": "Moonshot AI", - "display_name": "Moonshot AI", - "api": "https://api.moonshot.ai/v1", - "doc": "https://platform.moonshot.ai/docs/api/chat", - "models": [ + }, { - "id": "kimi-k2-0905-preview", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "qwen-plus-character", + "name": "Qwen Plus Character", + "display_name": "Qwen Plus Character", "modalities": { "input": [ "text" @@ -147301,8 +155844,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -147310,40 +155853,42 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.115, + "output": 0.287 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { @@ -147358,20 +155903,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.287, + "output": 1.147, + "reasoning": 2.868 }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -147381,14 +155926,19 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -147403,25 +155953,22 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.144, + "output": 1.434 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "kimi-k2-thinking", + "name": "Moonshot Kimi K2 Thinking", + "display_name": "Moonshot Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -147429,7 +155976,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -147448,22 +155995,20 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "display_name": "DeepSeek R1 Distill Qwen 14B", "modalities": { "input": [ "text" @@ -147473,30 +156018,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.4, - "output": 10, - "cache_read": 0.6 + "input": 0.144, + "output": 0.431 }, "type": "chat" }, { - "id": "kimi-k2-0711-preview", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "qwen-deep-research", + "name": "Qwen Deep Research", + "display_name": "Qwen Deep Research", "modalities": { "input": [ "text" @@ -147506,8 +156050,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -147515,21 +156059,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 7.742, + "output": 23.367 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen-mt-plus", + "name": "Qwen Mt Plus", + "display_name": "Qwen Mt Plus", "modalities": { "input": [ "text" @@ -147539,8 +156082,40 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 16384, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", + "cost": { + "input": 0.259, + "output": 0.775 + }, + "type": "chat" + }, + { + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -147561,40 +156136,101 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.3, + "output": 1.2 }, "type": "chat" - } - ] - }, - "berget": { - "id": "berget", - "name": "Berget.AI", - "display_name": "Berget.AI", - "api": "https://api.berget.ai/v1", - "doc": "https://api.berget.ai", - "models": [ + }, { - "id": "zai-org/GLM-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", + "cost": { + "input": 0.115, + "output": 0.287 + }, + "type": "chat" + }, + { + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 32768, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", + "cost": { + "input": 0.058, + "output": 0.23, + "input_audio": 3.584, + "output_audio": 7.168 + }, + "type": "chat" + }, + { + "id": "qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "display_name": "Qwen3-VL 30B-A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -147615,19 +156251,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.77, - "output": 2.75 + "input": 0.108, + "output": 0.431, + "reasoning": 1.076 }, "type": "chat" }, { - "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24B Instruct 2506", - "display_name": "Mistral Small 3.2 24B Instruct 2506", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -147637,8 +156274,8 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -147646,55 +156283,25 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", - "cost": { - "input": 0.33, - "output": 0.33 - }, - "type": "chat" - }, - { - "id": "mistralai/Mistral-Medium-3.5-128B", - "name": "Mistral Medium 3.5 128B", - "display_name": "Mistral Medium 3.5 128B", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "extra_capabilities": { + "reasoning": { + "supported": true + } }, - "attachment": true, - "open_weights": true, - "knowledge": "2026-04", - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "attachment": false, + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.65, - "output": 5.5 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "deepseek-v3-1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -147704,41 +156311,41 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-27", - "last_updated": "2025-04-27", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.99, - "output": 0.99 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "qwen3.5-flash", + "name": "Qwen3.5 Flash", + "display_name": "Qwen3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -147748,69 +156355,64 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.44, - "output": 0.99 + "input": 0.172, + "output": 1.72, + "reasoning": 1.72 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 31B Instruct", - "display_name": "Gemma 4 31B Instruct", + "id": "qwen-vl-ocr", + "name": "Qwen Vl Ocr", + "display_name": "Qwen Vl Ocr", "modalities": { "input": [ - "audio", - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 34096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", "cost": { - "input": 0.275, - "output": 0.55 + "input": 0.717, + "output": 0.717 }, "type": "chat" - } - ] - }, - "github-models": { - "id": "github-models", - "name": "GitHub Models", - "display_name": "GitHub Models", - "api": "https://models.github.ai/inference", - "doc": "https://docs.github.com/en/github-models", - "models": [ + }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "qwen-long", + "name": "Qwen Long", + "display_name": "Qwen Long", "modalities": { "input": [ "text" @@ -147820,30 +156422,29 @@ ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0, - "output": 0 + "input": 0.072, + "output": 0.287 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -147853,8 +156454,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -147862,43 +156463,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "display_name": "Qwen3-Omni Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { "context": 65536, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -147918,20 +156511,22 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0 + "input": 0.058, + "output": 0.23, + "input_audio": 3.584, + "output_audio": 7.168 }, "type": "chat" }, { - "id": "ai21-labs/ai21-jamba-1.5-mini", - "name": "AI21 Jamba 1.5 Mini", - "display_name": "AI21 Jamba 1.5 Mini", + "id": "qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "display_name": "Qwen2.5 14B Instruct", "modalities": { "input": [ "text" @@ -147941,30 +156536,29 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 + "input": 0.144, + "output": 0.431 }, "type": "chat" }, { - "id": "ai21-labs/ai21-jamba-1.5-large", - "name": "AI21 Jamba 1.5 Large", - "display_name": "AI21 Jamba 1.5 Large", + "id": "qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -147974,30 +156568,29 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-mini-instruct", - "name": "Phi-3.5-mini instruct (128k)", - "display_name": "Phi-3.5-mini instruct (128k)", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ "text" @@ -148007,41 +156600,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.861, + "output": 3.441 }, "type": "chat" }, { - "id": "microsoft/phi-3-medium-4k-instruct", - "name": "Phi-3-medium instruct (4k)", - "display_name": "Phi-3-medium instruct (4k)", + "id": "qvq-max", + "name": "QVQ Max", + "display_name": "QVQ Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -148050,20 +156643,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0, - "output": 0 + "input": 1.147, + "output": 4.588 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE instruct (128k)", - "display_name": "Phi-3.5-MoE instruct (128k)", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -148073,8 +156666,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 245800, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -148082,21 +156675,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "release_date": "2026-04-20", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0 + "input": 1.32, + "output": 7.9, + "cache_read": 0.132 }, "type": "chat" }, { - "id": "microsoft/phi-3-mini-128k-instruct", - "name": "Phi-3-mini instruct (128k)", - "display_name": "Phi-3-mini instruct (128k)", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ "text" @@ -148106,63 +156710,66 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.216, + "output": 0.861 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "display_name": "Qwen3-Omni Flash Realtime", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0 + "input": 0.23, + "output": 0.918, + "input_audio": 3.584, + "output_audio": 7.168 }, "type": "chat" }, { - "id": "microsoft/phi-4-reasoning", - "name": "Phi-4-Reasoning", - "display_name": "Phi-4-Reasoning", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -148172,30 +156779,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0, - "output": 0 + "input": 0.144, + "output": 0.574 }, "type": "chat" }, { - "id": "microsoft/phi-3-small-8k-instruct", - "name": "Phi-3-small instruct (8k)", - "display_name": "Phi-3-small instruct (8k)", + "id": "deepseek-r1-distill-qwen-7b", + "name": "DeepSeek R1 Distill Qwen 7B", + "display_name": "DeepSeek R1 Distill Qwen 7B", "modalities": { "input": [ "text" @@ -148205,8 +156811,8 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -148215,20 +156821,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.072, + "output": 0.144 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-vision-instruct", - "name": "Phi-3.5-vision instruct (128k)", - "display_name": "Phi-3.5-vision instruct (128k)", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ "text", @@ -148239,63 +156844,66 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 0, - "output": 0 + "input": 0.23, + "output": 0.574 }, "type": "chat" }, { - "id": "microsoft/phi-3-mini-4k-instruct", - "name": "Phi-3-mini instruct (4k)", - "display_name": "Phi-3-mini instruct (4k)", + "id": "qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "display_name": "Qwen2.5-Omni 7B", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0, - "output": 0 + "input": 0.087, + "output": 0.345, + "input_audio": 5.448 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ "text" @@ -148305,63 +156913,53 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "microsoft/phi-3-small-128k-instruct", - "name": "Phi-3-small instruct (128k)", - "display_name": "Phi-3-small instruct (128k)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "limit": { - "context": 128000, - "output": 4096 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "temperature": true, - "tool_call": true, - "reasoning": { + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0, - "output": 0 + "input": 0.115, + "output": 0.287, + "reasoning": 1.147 }, "type": "chat" }, { - "id": "microsoft/phi-3-medium-128k-instruct", - "name": "Phi-3-medium instruct (128k)", - "display_name": "Phi-3-medium instruct (128k)", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -148371,8 +156969,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -148380,32 +156978,44 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0, - "output": 0 + "input": 0.86, + "output": 3.15 }, "type": "chat" }, { - "id": "microsoft/phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "kimi-k2.6", + "name": "Moonshot Kimi K2.6", + "display_name": "Moonshot Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -148413,56 +157023,64 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0 + "input": 0.929, + "output": 3.858 }, "type": "chat" }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Phi-4-multimodal-instruct", - "display_name": "Phi-4-multimodal-instruct", + "id": "qwen2-5-coder-7b-instruct", + "name": "Qwen2.5-Coder 7B Instruct", + "display_name": "Qwen2.5-Coder 7B Instruct", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "cost": { - "input": 0, - "output": 0 + "input": 0.144, + "output": 0.287 }, "type": "chat" }, { - "id": "microsoft/mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "qwen3-14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ "text" @@ -148472,30 +157090,47 @@ ] }, "limit": { - "context": 65536, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 + "input": 0.144, + "output": 0.574, + "reasoning": 1.434 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-08-2024", - "name": "Cohere Command R 08-2024", - "display_name": "Cohere Command R 08-2024", + "id": "deepseek-v3-2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -148505,8 +157140,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -148515,19 +157150,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 + "input": 0.287, + "output": 0.431 }, "type": "chat" }, { - "id": "cohere/cohere-command-a", - "name": "Cohere Command A", - "display_name": "Cohere Command A", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -148537,62 +157171,76 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-plus", - "name": "Cohere Command R+", - "display_name": "Cohere Command R+", + "id": "kimi/kimi-k2.5", + "name": "kimi/kimi-k2.5", + "display_name": "kimi/kimi-k2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-04-04", - "last_updated": "2024-08-01", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "cohere/cohere-command-r", - "name": "Cohere Command R", - "display_name": "Cohere Command R", + "id": "siliconflow/deepseek-r1-0528", + "name": "siliconflow/deepseek-r1-0528", + "display_name": "siliconflow/deepseek-r1-0528", "modalities": { "input": [ "text" @@ -148602,8 +157250,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -148611,21 +157259,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-11", - "last_updated": "2024-08-01", + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-plus-08-2024", - "name": "Cohere Command R+ 08-2024", - "display_name": "Cohere Command R+ 08-2024", + "id": "siliconflow/deepseek-v3-0324", + "name": "siliconflow/deepseek-v3-0324", + "display_name": "siliconflow/deepseek-v3-0324", "modalities": { "input": [ "text" @@ -148635,8 +157293,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -148645,19 +157303,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "siliconflow/deepseek-v3.2", + "name": "siliconflow/deepseek-v3.2", + "display_name": "siliconflow/deepseek-v3.2", "modalities": { "input": [ "text" @@ -148667,8 +157324,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -148676,21 +157333,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "siliconflow/deepseek-v3.1-terminus", + "name": "siliconflow/deepseek-v3.1-terminus", + "display_name": "siliconflow/deepseek-v3.1-terminus", "modalities": { "input": [ "text" @@ -148700,8 +157361,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -148711,19 +157372,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "openai/o1-mini", - "name": "OpenAI o1-mini", - "display_name": "OpenAI o1-mini", + "id": "MiniMax/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -148733,11 +157393,11 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -148745,81 +157405,44 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", - "modalities": { - "input": [ - "text", - "image", - "audio" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI o4-mini", - "display_name": "OpenAI o4-mini", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 384000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -148827,32 +157450,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "openai/o1-preview", - "name": "OpenAI o1-preview", - "display_name": "OpenAI o1-preview", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -148862,11 +157483,11 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 384000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -148874,80 +157495,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "OpenAI o1", + "id": "qwen3-coder-plus-2025-09-23", + "name": "Qwen3 Coder Plus 2025 09 23", + "display_name": "Qwen3 Coder Plus 2025 09 23", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "OpenAI o3-mini", + "id": "qwen3-coder-plus-2025-07-22", + "name": "Qwen3 Coder Plus 2025 07 22", + "display_name": "Qwen3 Coder Plus 2025 07 22", "modalities": { "input": [ "text" @@ -148957,44 +157552,21 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", + "id": "qwen-vl-ocr-latest", + "name": "Qwen Vl Ocr Latest", + "display_name": "Qwen Vl Ocr Latest", "modalities": { "input": [ "text", @@ -149005,29 +157577,21 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 34096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, "type": "chat" }, { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "qvq-max-2025-05-15", + "name": "Qvq Max 2025 05 15", + "display_name": "Qvq Max 2025 05 15", "modalities": { "input": [ "text", @@ -149038,178 +157602,192 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "default": false, + "budget": { + "default": 16384, + "min": 0, + "max": 16384 } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "qwen-turbo-latest", + "name": "Qwen Turbo Latest", + "display_name": "Qwen Turbo Latest", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "qwen-turbo-2024-09-19", + "name": "Qwen Turbo 2024 09 19", + "display_name": "Qwen Turbo 2024 09 19", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": false, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "qwen-flash-2025-07-28", + "name": "Qwen Flash 2025 07 28", + "display_name": "Qwen Flash 2025 07 28", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta/meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "qwen-plus-2024-09-19", + "name": "Qwen Plus 2024 09 19", + "display_name": "Qwen Plus 2024 09 19", "modalities": { "input": [ "text" @@ -149219,30 +157797,21 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "qwen-plus-2025-07-14", + "name": "Qwen Plus 2025 07 14", + "display_name": "Qwen Plus 2025 07 14", "modalities": { "input": [ "text" @@ -149252,30 +157821,44 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta/meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "qwen-plus-2025-09-11", + "name": "Qwen Plus 2025 09 11", + "display_name": "Qwen Plus 2025 09 11", "modalities": { "input": [ "text" @@ -149285,100 +157868,104 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "meta/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "qwen-max-2024-09-19", + "name": "Qwen Max 2024 09 19", + "display_name": "Qwen Max 2024 09 19", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 32768, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "qwen-max-2024-04-28", + "name": "Qwen Max 2024 04 28", + "display_name": "Qwen Max 2024 04 28", "modalities": { "input": [ "text" @@ -149388,30 +157975,21 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "qwen-max-2024-04-03", + "name": "Qwen Max 2024 04 03", + "display_name": "Qwen Max 2024 04 03", "modalities": { "input": [ "text" @@ -149421,30 +157999,21 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "qwen-max-2025-01-25", + "name": "Qwen Max 2025 01 25", + "display_name": "Qwen Max 2025 01 25", "modalities": { "input": [ "text" @@ -149454,64 +158023,57 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "qwen3-max-2025-09-23", + "name": "Qwen3 Max 20250923", + "display_name": "Qwen3 Max 20250923", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "core42/jais-30b-chat", - "name": "JAIS 30b Chat", - "display_name": "JAIS 30b Chat", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -149521,30 +158083,38 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2023-08-30", - "last_updated": "2023-08-30", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "mistral-ai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -149554,30 +158124,38 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "mistral-ai/ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -149587,30 +158165,21 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "mistral-ai/mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -149620,98 +158189,103 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "mistral-ai/mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "mistral-ai/mistral-medium-2505", - "name": "Mistral Medium 3 (25.05)", - "display_name": "Mistral Medium 3 (25.05)", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "mistral-ai/codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "qwen3-4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ "text" @@ -149721,39 +158295,38 @@ ] }, "limit": { - "context": 32000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" - } - ] - }, - "neuralwatt": { - "id": "neuralwatt", - "name": "Neuralwatt", - "display_name": "Neuralwatt", - "api": "https://api.neuralwatt.com/v1", - "doc": "https://portal.neuralwatt.com/docs", - "models": [ + }, { - "id": "glm-5-fast", - "name": "GLM 5 Fast", - "display_name": "GLM 5 Fast", + "id": "qwen3-1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 1.7B", "modalities": { "input": [ "text" @@ -149763,63 +158336,83 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", - "cost": { - "input": 1.1, - "output": 3.6 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "kimi-k2.6-fast", - "name": "Kimi K2.6 Fast", - "display_name": "Kimi K2.6 Fast", + "id": "qwen3-0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0.69, - "output": 3.22 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "qwen3.5-397b-fast", - "name": "Qwen3.5 397B Fast", - "display_name": "Qwen3.5 397B Fast", + "id": "qwen3-vl-plus-2025-09-23", + "name": "Qwen3 VL Plus 2025 09 23", + "display_name": "Qwen3 VL Plus 2025 09 23", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -149827,12 +158420,18 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -149846,19 +158445,12 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", - "cost": { - "input": 0.69, - "output": 4.14 - }, "type": "chat" }, { - "id": "glm-5.1-fast", - "name": "GLM 5.1 Fast", - "display_name": "GLM 5.1 Fast", + "id": "qwq-plus-latest", + "name": "QwQ Plus Latest", + "display_name": "QwQ Plus Latest", "modalities": { "input": [ "text" @@ -149868,32 +158460,53 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { + "supported": true, + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", - "cost": { - "input": 1.1, - "output": 3.6 - }, "type": "chat" - }, + } + ] + }, + "drun": { + "id": "drun", + "name": "D.Run (China)", + "display_name": "D.Run (China)", + "api": "https://chat.d.run/v1", + "doc": "https://www.d.run", + "models": [ { - "id": "qwen3.6-35b-fast", - "name": "Qwen3.6 35B Fast", - "display_name": "Qwen3.6 35B Fast", + "id": "public/deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -149901,12 +158514,13 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -149919,52 +158533,53 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.05, - "output": 0.1 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "kimi-k2.5-fast", - "name": "Kimi K2.5 Fast", - "display_name": "Kimi K2.5 Fast", + "id": "public/deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 0.52, - "output": 2.59 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B-FP8", - "name": "Qwen3.5 397B A17B FP8", - "display_name": "Qwen3.5 397B A17B FP8", + "id": "public/minimax-m25", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -149974,8 +158589,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -149995,31 +158610,39 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "open_weights": false, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.69, - "output": 4.14 + "input": 0.29, + "output": 1.16 }, "type": "chat" - }, + } + ] + }, + "huggingface": { + "id": "huggingface", + "name": "Hugging Face", + "display_name": "Hugging Face", + "api": "https://router.huggingface.co/v1", + "doc": "https://huggingface.co/docs/inference-providers", + "models": [ { - "id": "Qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -150038,20 +158661,21 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.05, - "output": 0.1 + "input": 3, + "output": 5 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1-FP8", - "name": "GLM 5.1 FP8", - "display_name": "GLM 5.1 FP8", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -150061,8 +158685,8 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -150072,61 +158696,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", - "cost": { - "input": 1.1, - "output": 3.6 - }, - "type": "chat" - }, - { - "id": "mistralai/Devstral-Small-2-24B-Instruct-2512", - "name": "Devstral Small 2 24B Instruct 2512", - "display_name": "Devstral Small 2 24B Instruct 2512", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.12, - "output": 0.35 + "input": 0.28, + "output": 0.4 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi-K2-Instruct", + "display_name": "Kimi-K2-Instruct", "modalities": { "input": [ "text" @@ -150136,38 +158723,32 @@ ] }, "limit": { - "context": 16384, + "context": 131072, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.03, - "output": 0.16 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi-K2-Thinking", + "display_name": "Kimi-K2-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -150194,24 +158775,27 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.69, - "output": 3.22 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -150240,29 +158824,33 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-01", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.52, - "output": 2.59 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -150281,28 +158869,22 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-01", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.35, - "output": 1.38 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" - } - ] - }, - "togetherai": { - "id": "togetherai", - "name": "Together AI", - "display_name": "Together AI", - "doc": "https://docs.together.ai/docs/serverless-models", - "models": [ + }, { - "id": "essentialai/Rnj-1-Instruct", - "name": "Rnj-1 Instruct", - "display_name": "Rnj-1 Instruct", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi-K2-Instruct-0905", + "display_name": "Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -150312,8 +158894,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -150323,30 +158905,29 @@ "attachment": false, "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-12-05", - "last_updated": "2025-12-05", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 0.15, - "output": 0.15 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 130000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -150367,18 +158948,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { "input": 0.6, - "output": 3.6 + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-Plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -150388,8 +158971,8 @@ ] }, "limit": { - "context": 1000000, - "output": 500000 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -150410,18 +158993,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "knowledge": "2025-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.5, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next-FP8", - "name": "Qwen3 Coder Next FP8", - "display_name": "Qwen3 Coder Next FP8", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -150431,8 +159015,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -150440,21 +159024,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2026-02-03", - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.5, - "output": 1.2 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput", - "name": "Qwen3 235B A22B Instruct 2507 FP8", - "display_name": "Qwen3 235B A22B Instruct 2507 FP8", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -150464,8 +159059,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -150473,21 +159068,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "release_date": "2026-04-03", + "last_updated": "2026-04-03", "cost": { - "input": 0.2, - "output": 0.6 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -150498,28 +159104,29 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 2, - "output": 2 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -150529,7 +159136,7 @@ ] }, "limit": { - "context": 202752, + "context": 204800, "output": 131072 }, "temperature": true, @@ -150540,24 +159147,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "knowledge": "2025-10", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.4, - "output": 4.4 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "MiniMaxAI/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -150567,29 +159180,41 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.88, - "output": 0.88 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -150599,7 +159224,7 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, @@ -150608,21 +159233,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 1.25, - "output": 1.25 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -150632,11 +159268,11 @@ ] }, "limit": { - "context": 163839, - "output": 163839 + "context": 262144, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -150654,19 +159290,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-03-24", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 3, - "output": 7 + "input": 0.3, + "output": 3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -150676,30 +159312,29 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 0.6, - "output": 1.7 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -150709,14 +159344,13 @@ ] }, "limit": { - "context": 512000, - "output": 384000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -150731,30 +159365,31 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 2.1, - "output": 4.4, - "cache_read": 0.2 + "input": 0.3, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -150764,63 +159399,65 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 31B Instruct", - "display_name": "Gemma 4 31B Instruct", + "id": "Qwen/Qwen3-Embedding-4B", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 32000, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "Qwen/Qwen3-Coder-Next", + "name": "Qwen3-Coder-Next", + "display_name": "Qwen3-Coder-Next", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -150828,39 +159465,31 @@ }, "limit": { "context": 262144, - "output": 131000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2025-04", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 1.2, - "output": 4.5, - "cache_read": 0.2 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -150868,40 +159497,28 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.5, - "output": 2.8 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen 3 Embedding 8B", + "display_name": "Qwen 3 Embedding 8B", "modalities": { "input": [ "text" @@ -150911,35 +159528,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "MiniMaxAI/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -150949,8 +159560,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -150971,28 +159582,29 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" } ] }, - "qihang-ai": { - "id": "qihang-ai", - "name": "QiHang", - "display_name": "QiHang", - "api": "https://api.qhaigc.net/v1", - "doc": "https://www.qhaigc.net/docs", + "umans-ai-coding-plan": { + "id": "umans-ai-coding-plan", + "name": "Umans AI Coding Plan", + "display_name": "Umans AI Coding Plan", + "api": "https://api.code.umans.ai/v1", + "doc": "https://app.umans.ai/offers/code/docs", "models": [ { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "umans-qwen3.6-35b-a3b", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ "text", @@ -151003,45 +159615,42 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.71, - "output": 3.57 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "umans-glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -151052,41 +159661,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.07, - "output": 0.43, - "context_over_200k": { - "input": 0.07, - "output": 0.43 - } + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5-Mini", - "display_name": "GPT-5-Mini", + "id": "umans-coder", + "name": "Umans Coder", + "display_name": "Umans Coder", "modalities": { "input": [ "text", @@ -151097,10 +159695,10 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -151109,187 +159707,169 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.04, - "output": 0.29 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "umans-flash", + "name": "Umans Flash", + "display_name": "Umans Flash", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.57, - "output": 3.43 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "umans-kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.43, - "output": 2.14 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "tencent-tokenhub": { + "id": "tencent-tokenhub", + "name": "Tencent TokenHub", + "display_name": "Tencent TokenHub", + "api": "https://tokenhub.tencentmaas.com/v1", + "doc": "https://cloud.tencent.com/document/product/1823/130050", + "models": [ { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "hy3-preview", + "name": "Hy3 preview", + "display_name": "Hy3 preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.25, - "output": 2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "gitlab": { + "id": "gitlab", + "name": "GitLab Duo", + "display_name": "GitLab Duo", + "doc": "https://docs.gitlab.com/user/duo_agent_platform/", + "models": [ { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "duo-chat-gpt-5-2-codex", + "name": "Agentic Chat (GPT-5.2 Codex)", + "display_name": "Agentic Chat (GPT-5.2 Codex)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -151305,48 +159885,25 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 0.14, - "output": 1.14 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "duo-chat-haiku-4-5", + "name": "Agentic Chat (Claude Haiku 4.5)", + "display_name": "Agentic Chat (Claude Haiku 4.5)", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -151354,8 +159911,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -151363,45 +159920,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-02-28", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", "cost": { - "input": 0.09, - "output": 0.71, - "context_over_200k": { - "input": 0.09, - "output": 0.71 - } + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "duo-chat-opus-4-6", + "name": "Agentic Chat (Claude Opus 4.6)", + "display_name": "Agentic Chat (Claude Opus 4.6)", "modalities": { "input": [ "text", @@ -151413,7 +159948,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -151424,70 +159959,55 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.14, - "output": 0.71 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "tencent-tokenhub": { - "id": "tencent-tokenhub", - "name": "Tencent TokenHub", - "display_name": "Tencent TokenHub", - "api": "https://tokenhub.tencentmaas.com/v1", - "doc": "https://cloud.tencent.com/document/product/1823/130050", - "models": [ + }, { - "id": "hy3-preview", - "name": "Hy3 preview", - "display_name": "Hy3 preview", + "id": "duo-chat-gpt-5-2", + "name": "Agentic Chat (GPT-5.2)", + "display_name": "Agentic Chat (GPT-5.2)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" - } - ] - }, - "anthropic": { - "id": "anthropic", - "name": "Anthropic", - "display_name": "Anthropic", - "doc": "https://docs.anthropic.com/en/docs/about-claude/models", - "models": [ + }, { - "id": "claude-3-sonnet-20240229", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "duo-chat-gpt-5-3-codex", + "name": "Agentic Chat (GPT-5.3 Codex)", + "display_name": "Agentic Chat (GPT-5.3 Codex)", "modalities": { "input": [ "text", @@ -151499,73 +160019,64 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "duo-chat-gpt-5-1", + "name": "Agentic Chat (GPT-5.1)", + "display_name": "Agentic Chat (GPT-5.1)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "duo-chat-opus-4-5", + "name": "Agentic Chat (Claude Opus 4.5)", + "display_name": "Agentic Chat (Claude Opus 4.5)", "modalities": { "input": [ "text", @@ -151589,20 +160100,20 @@ "attachment": true, "open_weights": false, "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-3-opus-20240229", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "duo-chat-opus-4-7", + "name": "Agentic Chat (Claude Opus 4.7)", + "display_name": "Agentic Chat (Claude Opus 4.7)", "modalities": { "input": [ "text", @@ -151614,31 +160125,32 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1000000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "duo-chat-sonnet-4-5", + "name": "Agentic Chat (Claude Sonnet 4.5)", + "display_name": "Agentic Chat (Claude Sonnet 4.5)", "modalities": { "input": [ "text", @@ -151651,144 +160163,113 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-07-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "duo-chat-gpt-5-4-nano", + "name": "Agentic Chat (GPT-5.4 Nano)", + "display_name": "Agentic Chat (GPT-5.4 Nano)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "duo-chat-gpt-5-codex", + "name": "Agentic Chat (GPT-5 Codex)", + "display_name": "Agentic Chat (GPT-5 Codex)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-opus-4-0", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "duo-chat-gpt-5-4-mini", + "name": "Agentic Chat (GPT-5.4 Mini)", + "display_name": "Agentic Chat (GPT-5.4 Mini)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -151796,82 +160277,53 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "duo-chat-gpt-5-mini", + "name": "Agentic Chat (GPT-5 Mini)", + "display_name": "Agentic Chat (GPT-5 Mini)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-05-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-haiku-20240307", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "duo-chat-sonnet-4-6", + "name": "Agentic Chat (Claude Sonnet 4.6)", + "display_name": "Agentic Chat (Claude Sonnet 4.6)", "modalities": { "input": [ "text", @@ -151883,31 +160335,32 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "duo-chat-gpt-5-5", + "name": "Agentic Chat (GPT-5.5)", + "display_name": "Agentic Chat (GPT-5.5)", "modalities": { "input": [ "text", @@ -151919,10 +160372,10 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -151930,21 +160383,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08-31", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-5-haiku-latest", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "duo-chat-gpt-5-4", + "name": "Agentic Chat (GPT-5.4)", + "display_name": "Agentic Chat (GPT-5.4)", "modalities": { "input": [ "text", @@ -151956,44 +160407,50 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "nebius": { + "id": "nebius", + "name": "Nebius Token Factory", + "display_name": "Nebius Token Factory", + "api": "https://api.tokenfactory.nebius.com/v1", + "doc": "https://docs.tokenfactory.nebius.com/", + "models": [ { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "deepseek-ai/DeepSeek-V3.2-fast", + "name": "DeepSeek-V3.2-fast", + "display_name": "DeepSeek-V3.2-fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152001,41 +160458,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2026-05-07", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.4, + "output": 2, + "cache_read": 0.04, + "cache_write": 0.5 }, "type": "chat" }, { - "id": "claude-sonnet-4-0", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -152045,75 +160495,92 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 0.45, + "reasoning": 0.45, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20240620", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "moonshotai/Kimi-K2.5-fast", + "name": "Kimi-K2.5-fast", + "display_name": "Kimi-K2.5-fast", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 256000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-15", + "last_updated": "2026-02-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.5, + "output": 2.5, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152123,39 +160590,44 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-15", + "last_updated": "2026-02-04", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.5, + "output": 2.5, + "reasoning": 2.5, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "openai/gpt-oss-120b-fast", + "name": "gpt-oss-120b-fast", + "display_name": "gpt-oss-120b-fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152163,36 +160635,34 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-06-10", + "last_updated": "2026-05-07", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.1, + "output": 0.5, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152200,28 +160670,38 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.15, + "output": 0.6, + "reasoning": 0.6, + "cache_read": 0.015, + "cache_write": 0.18 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -152229,7 +160709,7 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -152237,156 +160717,139 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2026-01", + "release_date": "2026-03-01", + "last_updated": "2026-03-10", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1, + "output": 3.2, + "cache_read": 0.1, + "cache_write": 1 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "NousResearch/Hermes-4-405B", + "name": "Hermes-4-405B", + "display_name": "Hermes-4-405B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1, + "output": 3, + "reasoning": 3, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "NousResearch/Hermes-4-70B", + "name": "Hermes-4-70B", + "display_name": "Hermes-4-70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.13, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "nvidia/Nemotron-3-Nano-Omni", + "name": "Nemotron-3-Nano-Omni", + "display_name": "Nemotron-3-Nano-Omni", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152394,41 +160857,68 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", + "cost": { + "input": 0.06, + "output": 0.24, + "cache_read": 0.006, + "cache_write": 0.075 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "type": "chat" + }, + { + "id": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B", + "name": "Nemotron-3-Nano-30B-A3B", + "display_name": "Nemotron-3-Nano-30B-A3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-08-10", + "last_updated": "2026-02-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.06, + "output": 0.24, + "cache_read": 0.006, + "cache_write": 0.075 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron-3-Super-120B-A12B", + "display_name": "Nemotron-3-Super-120B-A12B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -152436,32 +160926,21 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-12", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - } - ] - }, - "modelscope": { - "id": "modelscope", - "name": "ModelScope", - "display_name": "ModelScope", - "api": "https://api-inference.modelscope.cn/v1", - "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", - "models": [ + "input": 0.3, + "output": 0.9 + }, + "type": "chat" + }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", + "name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", "modalities": { "input": [ "text" @@ -152471,73 +160950,66 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 1.8, + "cache_read": 0.06, + "cache_write": 0.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "google/gemma-3-27b-it", + "name": "Gemma-3-27b-it", + "display_name": "Gemma-3-27b-it", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 110000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2025-10", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "google/gemma-2-2b-it", + "name": "Gemma-2-2b-it", + "display_name": "Gemma-2-2b-it", "modalities": { "input": [ "text" @@ -152547,29 +161019,31 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 8192, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "knowledge": "2024-06", + "release_date": "2024-07-31", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -152579,8 +161053,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -152589,19 +161063,21 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "knowledge": "2024-12", + "release_date": "2024-07-23", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -152611,41 +161087,31 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "knowledge": "2025-08", + "release_date": "2025-12-05", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.13, + "output": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 }, "type": "chat" }, { - "id": "ZhipuAI/GLM-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "MiniMaxAI/MiniMax-M2.5-fast", + "name": "MiniMax-M2.5-fast", + "display_name": "MiniMax-M2.5-fast", "modalities": { "input": [ "text" @@ -152655,8 +161121,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152666,19 +161132,21 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "ZhipuAI/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -152688,8 +161156,8 @@ ] }, "limit": { - "context": 202752, - "output": 98304 + "context": 196608, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152704,28 +161172,21 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" - } - ] - }, - "hpc-ai": { - "id": "hpc-ai", - "name": "HPC-AI", - "display_name": "HPC-AI", - "api": "https://api.hpc-ai.com/inference/v1", - "doc": "https://www.hpc-ai.com/doc/docs/quickstart/", - "models": [ + }, { - "id": "zai-org/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "PrimeIntellect/INTELLECT-3", + "name": "INTELLECT-3", + "display_name": "INTELLECT-3", "modalities": { "input": [ "text" @@ -152735,41 +161196,31 @@ ] }, "limit": { - "context": 202000, - "output": 202000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "knowledge": "2025-10", + "release_date": "2026-01-25", + "last_updated": "2026-02-04", "cost": { - "input": 0.66, - "output": 2, - "cache_read": 0.12 + "input": 0.2, + "output": 1.1, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -152779,8 +161230,8 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -152790,43 +161241,49 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-25", + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 0.14, - "output": 0.56, - "cache_read": 0.014 + "input": 0.15, + "output": 1.2, + "reasoning": 1.2, + "cache_read": 0.015, + "cache_write": 0.18 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "Qwen/Qwen3-32B", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -152841,62 +161298,55 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01-01", - "release_date": "2026-01-01", - "last_updated": "2026-03-25", + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 0.21, - "output": 1, - "cache_read": 0.03 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" - } - ] - }, - "gitlab": { - "id": "gitlab", - "name": "GitLab Duo", - "display_name": "GitLab Duo", - "doc": "https://docs.gitlab.com/user/duo_agent_platform/", - "models": [ + }, { - "id": "duo-chat-gpt-5-4-nano", - "name": "Agentic Chat (GPT-5.4 Nano)", - "display_name": "Agentic Chat (GPT-5.4 Nano)", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-mini", - "name": "Agentic Chat (GPT-5 Mini)", - "display_name": "Agentic Chat (GPT-5 Mini)", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", @@ -152907,43 +161357,42 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025, + "cache_write": 0.31 }, "type": "chat" }, { - "id": "duo-chat-sonnet-4-6", - "name": "Agentic Chat (Claude Sonnet 4.6)", - "display_name": "Agentic Chat (Claude Sonnet 4.6)", + "id": "Qwen/Qwen3.5-397B-A17B-fast", + "name": "Qwen3.5-397B-A17B-fast", + "display_name": "Qwen3.5-397B-A17B-fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -152951,342 +161400,435 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-15", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.6, + "output": 3.6, + "cache_read": 0.06, + "cache_write": 0.75 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-2", - "name": "Agentic Chat (GPT-5.2)", - "display_name": "Agentic Chat (GPT-5.2)", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-10-04", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-codex", - "name": "Agentic Chat (GPT-5 Codex)", - "display_name": "Agentic Chat (GPT-5 Codex)", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking-fast", + "name": "Qwen3-Next-80B-A3B-Thinking-fast", + "display_name": "Qwen3-Next-80B-A3B-Thinking-fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 1.2, + "cache_read": 0.015, + "cache_write": 0.1875 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-1", - "name": "Agentic Chat (GPT-5.1)", - "display_name": "Agentic Chat (GPT-5.1)", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-15", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3.6, + "cache_read": 0.06, + "cache_write": 0.75 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-2-codex", - "name": "Agentic Chat (GPT-5.2 Codex)", - "display_name": "Agentic Chat (GPT-5.2 Codex)", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507-fast", + "name": "Qwen3-235B-A22B-Thinking-2507-fast", + "display_name": "Qwen3-235B-A22B-Thinking-2507-fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 2, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "duo-chat-sonnet-4-5", - "name": "Agentic Chat (Claude Sonnet 4.5)", - "display_name": "Agentic Chat (Claude Sonnet 4.5)", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen3-Embedding-8B", + "display_name": "Qwen3-Embedding-8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2026-01-08", - "last_updated": "2026-01-08", + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "duo-chat-gpt-5-4", - "name": "Agentic Chat (GPT-5.4)", - "display_name": "Agentic Chat (GPT-5.4)", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 3.5, + "cache_read": 0.15 }, "type": "chat" - }, + } + ] + }, + "hpc-ai": { + "id": "hpc-ai", + "name": "HPC-AI", + "display_name": "HPC-AI", + "api": "https://api.hpc-ai.com/inference/v1", + "doc": "https://www.hpc-ai.com/doc/docs/quickstart/", + "models": [ { - "id": "duo-chat-haiku-4-5", - "name": "Agentic Chat (Claude Haiku 4.5)", - "display_name": "Agentic Chat (Claude Haiku 4.5)", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2026-01-08", - "last_updated": "2026-01-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01-01", + "release_date": "2026-01-01", + "last_updated": "2026-03-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.21, + "output": 1, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-3-codex", - "name": "Agentic Chat (GPT-5.3 Codex)", - "display_name": "Agentic Chat (GPT-5.3 Codex)", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202000, + "output": 202000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0, - "output": 0 + "input": 0.66, + "output": 2, + "cache_read": 0.12 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-4-mini", - "name": "Agentic Chat (GPT-5.4 Mini)", - "display_name": "Agentic Chat (GPT-5.4 Mini)", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-03-25", "cost": { - "input": 0, - "output": 0 + "input": 0.14, + "output": 0.56, + "cache_read": 0.014 }, "type": "chat" - }, + } + ] + }, + "xiaomi": { + "id": "xiaomi", + "name": "Xiaomi", + "display_name": "Xiaomi", + "api": "https://api.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ { - "id": "duo-chat-opus-4-7", - "name": "Agentic Chat (Claude Opus 4.7)", - "display_name": "Agentic Chat (Claude Opus 4.7)", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -153294,45 +161836,53 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "duo-chat-opus-4-5", - "name": "Agentic Chat (Claude Opus 4.5)", - "display_name": "Agentic Chat (Claude Opus 4.5)", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -153340,36 +161890,60 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2026-01-08", - "last_updated": "2026-01-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "duo-chat-opus-4-6", - "name": "Agentic Chat (Claude Opus 4.6)", - "display_name": "Agentic Chat (Claude Opus 4.6)", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -153377,32 +161951,33 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" - } - ] - }, - "xiaomi": { - "id": "xiaomi", - "name": "Xiaomi", - "display_name": "Xiaomi", - "api": "https://api.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ + }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -153433,14 +162008,25 @@ } }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 1, "output": 3, "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], "context_over_200k": { "input": 2, "output": 6, @@ -153450,23 +162036,22 @@ "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ "text", "image", "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 131072 }, "temperature": true, @@ -153487,189 +162072,241 @@ } }, "attachment": true, - "open_weights": false, + "open_weights": true, "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { "input": 0.4, "output": 2, - "cache_read": 0.08 + "cache_read": 0.08, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + } }, "type": "chat" - }, + } + ] + }, + "github-copilot": { + "id": "github-copilot", + "name": "GitHub Copilot", + "display_name": "GitHub Copilot", + "api": "https://api.githubcopilot.com", + "doc": "https://docs.github.com/en/copilot", + "models": [ { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "claude-opus-41", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 80000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 264000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "clarifai": { - "id": "clarifai", - "name": "Clarifai", - "display_name": "Clarifai", - "api": "https://api.clarifai.com/v2/ext/openai/v1", - "doc": "https://docs.clarifai.com/compute/inference/", - "models": [ + }, { - "id": "arcee_ai/AFM/models/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 144000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -153677,33 +162314,35 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-12", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.045, - "output": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/completion/models/Ministral-3-14B-Reasoning-2512", - "name": "Ministral 3 14B Reasoning 2512", - "display_name": "Ministral 3 14B Reasoning 2512", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -153711,21 +162350,40 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-12", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 2.5, - "output": 1.7 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistralai/completion/models/Ministral-3-3B-Reasoning-2512", - "name": "Ministral 3 3B Reasoning 2512", - "display_name": "Ministral 3 3B Reasoning 2512", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-mini", + "display_name": "GPT-5.1-Codex-mini", "modalities": { "input": [ "text", @@ -153736,141 +162394,196 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12", - "last_updated": "2026-02-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1.039, - "output": 0.54825 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-ocr/models/DeepSeek-OCR", - "name": "DeepSeek OCR", - "display_name": "DeepSeek OCR", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2026-02-25", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-27", + "last_updated": "2025-08-27", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/chat-completion/models/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 144000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-12-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.045, - "output": 0.18 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/chat-completion/models/gpt-oss-120b-high-throughput", - "name": "GPT OSS 120B High Throughput", - "display_name": "GPT OSS 120B High Throughput", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.09, - "output": 0.36 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimaxai/chat-completion/models/MiniMax-M2_5-high-throughput", - "name": "MiniMax-M2.5 High Throughput", - "display_name": "MiniMax-M2.5 High Throughput", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -153878,159 +162591,239 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwenCoder/models/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 264000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2026-02-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.11458, - "output": 0.74812 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-31", - "last_updated": "2026-02-25", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.36, - "output": 1.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2026-02-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.3, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "clarifai/main/models/mm-poly-8b", - "name": "MM Poly 8B", - "display_name": "MM Poly 8B", + "id": "claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 144000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2026-02-25", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.658, - "output": 1.11 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "moonshotai/chat-completion/models/Kimi-K2_6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", @@ -154041,8 +162834,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -154053,88 +162846,104 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, + "open_weights": false, "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.95, - "output": 4 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "minimax-cn": { - "id": "minimax-cn", - "name": "MiniMax (minimaxi.com)", - "display_name": "MiniMax (minimaxi.com)", - "api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/guides/quickstart", - "models": [ + }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-max", + "display_name": "GPT-5.1-Codex-max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -154142,36 +162951,54 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -154182,41 +163009,49 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 160000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -154224,44 +163059,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 216000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -154269,198 +163093,299 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "regolo-ai": { - "id": "regolo-ai", - "name": "Regolo AI", - "display_name": "Regolo AI", - "api": "https://api.regolo.ai/v1", - "doc": "https://docs.regolo.ai/", - "models": [ + }, { - "id": "mistral-small3.2", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 120000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.5, - "output": 2.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-embedding-8b", - "name": "Qwen3-Embedding-8B", - "display_name": "Qwen3-Embedding-8B", + "id": "gpt-5-mini", + "name": "GPT-5-mini", + "display_name": "GPT-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 264000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0, + "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "gpt-5.3-codex", + "name": "GPT-5.3-Codex", + "display_name": "GPT-5.3-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.6, - "output": 2.7 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-reranker-4b", - "name": "Qwen3-Reranker-4B", - "display_name": "Qwen3-Reranker-4B", + "id": "claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 144000, + "output": 64000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.12, - "output": 0.12 + "input": 0, + "output": 0 }, - "type": "rerank" + "type": "chat" }, { - "id": "mistral-small-4-119b", - "name": "Mistral Small 4 119B", - "display_name": "Mistral Small 4 119B", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -154471,8 +163396,8 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -154480,35 +163405,64 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.75, - "output": 3 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "togetherai": { + "id": "togetherai", + "name": "Together AI", + "display_name": "Together AI", + "doc": "https://docs.together.ai/docs/serverless-models", + "models": [ { - "id": "qwen3.5-122b", - "name": "Qwen3.5-122B", - "display_name": "Qwen3.5-122B", + "id": "deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 163839, + "output": 163839 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -154524,51 +163478,65 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-03-24", "cost": { - "input": 0.9, - "output": 3.6 + "input": 3, + "output": 7 }, "type": "chat" }, { - "id": "qwen-image", - "name": "Qwen-Image", - "display_name": "Qwen-Image", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 512000, + "output": 384000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.5, - "output": 2 + "input": 2.1, + "output": 4.4, + "cache_read": 0.2 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3-Coder-Next", - "display_name": "Qwen3-Coder-Next", + "id": "deepseek-ai/DeepSeek-V3-1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -154578,8 +163546,8 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -154589,18 +163557,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "knowledge": "2025-08", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.6, + "output": 1.7 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax 2.5", - "display_name": "MiniMax 2.5", + "id": "deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -154610,8 +163579,8 @@ ] }, "limit": { - "context": 190000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -154619,36 +163588,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-10", - "last_updated": "2026-03-10", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.8, - "output": 3.5 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "GPT-OSS-20B", - "display_name": "GPT-OSS-20B", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -154661,20 +163628,22 @@ "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.4, - "output": 1.8 + "input": 1.2, + "output": 4.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "qwen3.5-9b", - "name": "Qwen3.5-9B", - "display_name": "Qwen3.5-9B", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -154686,7 +163655,7 @@ }, "limit": { "context": 262144, - "output": 8192 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -154705,20 +163674,21 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.5, + "output": 2.8 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -154728,8 +163698,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -154743,19 +163713,20 @@ } }, "attachment": false, - "open_weights": false, + "open_weights": true, + "knowledge": "2025-08", "release_date": "2025-08-05", "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 4.2 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -154765,70 +163736,39 @@ ] }, "limit": { - "context": 120000, - "output": 120000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-07", - "last_updated": "2025-04-07", - "cost": { - "input": 0.05, - "output": 0.25 - }, - "type": "chat" - } - ] - }, - "xiaomi-token-plan-ams": { - "id": "xiaomi-token-plan-ams", - "name": "Xiaomi Token Plan (Europe)", - "display_name": "Xiaomi Token Plan (Europe)", - "api": "https://token-plan-ams.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ - { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 16384 + "supported": true, + "default": true }, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-11", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0, - "output": 0 + "input": 1.4, + "output": 4.4 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B Instruct", + "display_name": "Gemma 4 31B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -154836,7 +163776,7 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -154844,33 +163784,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "knowledge": "2025-01", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -154880,114 +163808,71 @@ ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.88, + "output": 0.88 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "essentialai/Rnj-1-Instruct", + "name": "Rnj-1 Instruct", + "display_name": "Rnj-1 Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2024-10", + "release_date": "2025-12-05", + "last_updated": "2025-12-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "MiniMaxAI/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 202752, "output": 131072 }, "temperature": true, @@ -155007,22 +163892,21 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", + "attachment": false, + "open_weights": true, "release_date": "2026-03-18", "last_updated": "2026-03-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -155032,7 +163916,7 @@ ] }, "limit": { - "context": 1048576, + "context": 204800, "output": 131072 }, "temperature": true, @@ -155043,93 +163927,56 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "context_over_200k": { - "input": 0, - "output": 0, - "cache_read": 0 - } + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" - } - ] - }, - "zhipuai": { - "id": "zhipuai", - "name": "Zhipu AI", - "display_name": "Zhipu AI", - "api": "https://open.bigmodel.cn/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ + }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 5, - "output": 22, - "cache_read": 1.2, - "cache_write": 0 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput", + "name": "Qwen3 235B A22B Instruct 2507 FP8", + "display_name": "Qwen3 235B A22B Instruct 2507 FP8", "modalities": { "input": [ "text" @@ -155139,8 +163986,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -155148,33 +163995,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "Qwen/Qwen3.6-Plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text" @@ -155184,8 +164019,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 500000 }, "temperature": true, "tool_call": true, @@ -155205,21 +164040,19 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": true, + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 6, - "output": 24, - "cache_read": 1.3, - "cache_write": 0 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "Qwen/Qwen3-Coder-Next-FP8", + "name": "Qwen3 Coder Next FP8", + "display_name": "Qwen3 Coder Next FP8", "modalities": { "input": [ "text" @@ -155229,8 +164062,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -155238,39 +164071,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2026-02-03", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.5, + "output": 1.2 }, "type": "chat" }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 262144, + "output": 130000 }, "temperature": true, "tool_call": true, @@ -155278,58 +164105,72 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.6, + "output": 3.6 }, "type": "chat" - }, + } + ] + }, + "inference": { + "id": "inference", + "name": "Inference", + "display_name": "Inference", + "api": "https://inference.net/v1", + "doc": "https://inference.net/models", + "models": [ { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "osmosis/osmosis-structure-0.6b", + "name": "Osmosis Structure 0.6B", + "display_name": "Osmosis Structure 0.6B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 4000, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "mistral/mistral-nemo-12b-instruct", + "name": "Mistral Nemo 12B Instruct", + "display_name": "Mistral Nemo 12B Instruct", "modalities": { "input": [ "text" @@ -155339,72 +164180,62 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.038, + "output": 0.1 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "qwen/qwen-2.5-7b-vision-instruct", + "name": "Qwen 2.5 7B Vision Instruct", + "display_name": "Qwen 2.5 7B Vision Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 125000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "qwen/qwen3-embedding-4b", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", "modalities": { "input": [ "text" @@ -155414,67 +164245,62 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 32000, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "google/gemma-3", + "name": "Google Gemma 3", + "display_name": "Google Gemma 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 125000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.15, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -155484,152 +164310,119 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.055, + "output": 0.055 }, "type": "chat" - } - ] - }, - "nova": { - "id": "nova", - "name": "Nova", - "display_name": "Nova", - "api": "https://api.nova.amazon.com/v1", - "doc": "https://nova.amazon.com/dev/documentation", - "models": [ + }, { - "id": "nova-2-lite-v1", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0, - "reasoning": 0 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "nova-2-pro-v1", - "name": "Nova 2 Pro", - "display_name": "Nova 2 Pro", + "id": "meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2026-01-03", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0, - "reasoning": 0 + "input": 0.025, + "output": 0.025 }, "type": "chat" } @@ -167648,9 +176441,9 @@ "type": "chat" }, { - "id": "minimax-m2.7", - "name": "minimax-m2.7", - "display_name": "minimax-m2.7", + "id": "minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", "modalities": { "input": [ "text" @@ -167660,8 +176453,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 204800, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -167670,19 +176463,13 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-12-23", + "last_updated": "2026-01-19", "type": "chat" }, { @@ -167725,9 +176512,9 @@ "type": "chat" }, { - "id": "glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "glm-5.1", + "name": "glm-5.1", + "display_name": "glm-5.1", "modalities": { "input": [ "text" @@ -167758,18 +176545,17 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2026-01-19", + "release_date": "2026-03-27", + "last_updated": "2026-04-07", "type": "chat" }, { - "id": "qwen3.5:397b", - "name": "qwen3.5:397b", - "display_name": "qwen3.5:397b", + "id": "kimi-k2:1t", + "name": "kimi-k2:1t", + "display_name": "kimi-k2:1t", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -167777,34 +176563,54 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "minimax-m2", + "name": "minimax-m2", + "display_name": "minimax-m2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-17", + "release_date": "2025-10-23", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "glm-5", - "name": "glm-5", - "display_name": "glm-5", + "id": "deepseek-v4-pro", + "name": "deepseek-v4-pro", + "display_name": "deepseek-v4-pro", "modalities": { "input": [ "text" @@ -167814,8 +176620,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 1048576, + "output": 1048576 }, "tool_call": true, "reasoning": { @@ -167835,41 +176641,46 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "type": "chat" }, { - "id": "qwen3-vl:235b-instruct", - "name": "qwen3-vl:235b-instruct", - "display_name": "qwen3-vl:235b-instruct", + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 163840, + "output": 65536 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-09-22", + "release_date": "2025-06-15", "last_updated": "2026-01-19", "type": "chat" }, { - "id": "minimax-m2", - "name": "minimax-m2", - "display_name": "minimax-m2", + "id": "minimax-m2.5", + "name": "minimax-m2.5", + "display_name": "minimax-m2.5", "modalities": { "input": [ "text" @@ -167880,11 +176691,12 @@ }, "limit": { "context": 204800, - "output": 128000 + "output": 131072 }, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -167893,14 +176705,15 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-10-23", - "last_updated": "2026-01-19", + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "minimax-m2.1", - "name": "minimax-m2.1", - "display_name": "minimax-m2.1", + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", "modalities": { "input": [ "text" @@ -167910,7 +176723,7 @@ ] }, "limit": { - "context": 204800, + "context": 202752, "output": 131072 }, "tool_call": true, @@ -167925,14 +176738,14 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", + "release_date": "2025-09-29", "last_updated": "2026-01-19", "type": "chat" }, { - "id": "glm-5.1", - "name": "glm-5.1", - "display_name": "glm-5.1", + "id": "minimax-m2.7", + "name": "minimax-m2.7", + "display_name": "minimax-m2.7", "modalities": { "input": [ "text" @@ -167942,8 +176755,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 196608, + "output": 196608 }, "tool_call": true, "reasoning": { @@ -167963,14 +176776,53 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-07", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "type": "chat" }, { - "id": "mistral-large-3:675b", - "name": "mistral-large-3:675b", - "display_name": "mistral-large-3:675b", + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "qwen3-vl:235b-instruct", + "name": "qwen3-vl:235b-instruct", + "display_name": "qwen3-vl:235b-instruct", "modalities": { "input": [ "text", @@ -167982,7 +176834,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 131072 }, "tool_call": true, "reasoning": { @@ -167990,10 +176842,49 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-12-02", + "release_date": "2025-09-22", "last_updated": "2026-01-19", "type": "chat" }, + { + "id": "qwen3.5:397b", + "name": "qwen3.5:397b", + "display_name": "qwen3.5:397b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-17", + "type": "chat" + }, { "id": "deepseek-v4-flash", "name": "deepseek-v4-flash", @@ -168033,9 +176924,9 @@ "type": "chat" }, { - "id": "glm-4.6", - "name": "glm-4.6", - "display_name": "glm-4.6", + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ "text" @@ -168055,15 +176946,59 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-09-29", + "release_date": "2025-12-22", "last_updated": "2026-01-19", "type": "chat" }, + { + "id": "glm-5", + "name": "glm-5", + "display_name": "glm-5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 202752, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "type": "chat" + }, { "id": "kimi-k2.6", "name": "kimi-k2.6", @@ -168098,154 +177033,13 @@ "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "deepseek-v4-pro", - "display_name": "deepseek-v4-pro", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1048576, - "output": 1048576 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "type": "chat" - }, - { - "id": "minimax-m2.5", - "name": "minimax-m2.5", - "display_name": "minimax-m2.5", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 204800, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", - "type": "chat" - }, - { - "id": "deepseek-v3.2", - "name": "deepseek-v3.2", - "display_name": "deepseek-v3.2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 163840, - "output": 65536 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-15", - "last_updated": "2026-01-19", - "type": "chat" - }, - { - "id": "kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2026-01-19", - "type": "chat" - }, - { - "id": "kimi-k2:1t", - "name": "kimi-k2:1t", - "display_name": "kimi-k2:1t", + "id": "mistral-large-3:675b", + "name": "mistral-large-3:675b", + "display_name": "mistral-large-3:675b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -168259,10 +177053,9 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", + "release_date": "2025-12-02", "last_updated": "2026-01-19", "type": "chat" } @@ -171998,7 +180791,7 @@ "default": true }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172022,7 +180815,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172046,7 +180839,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172070,7 +180863,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172095,7 +180888,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172120,7 +180913,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "embedding" }, { @@ -172145,7 +180938,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "embedding" }, { @@ -172171,7 +180964,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172197,7 +180990,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172223,7 +181016,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172249,7 +181042,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172275,7 +181068,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172293,7 +181086,7 @@ }, "limit": { "context": 256000, - "output": 32000 + "output": 64000 }, "tool_call": true, "reasoning": { @@ -172301,7 +181094,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172327,7 +181120,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172353,7 +181146,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172379,7 +181172,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172405,7 +181198,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172431,7 +181224,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172457,7 +181250,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172481,7 +181274,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172507,7 +181300,7 @@ "default": true }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172531,7 +181324,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172552,7 +181345,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedance-1-0-pro-fast-251015", @@ -172572,7 +181365,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedance-1-5-pro-251215", @@ -172593,7 +181386,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedance-2-0-260128", @@ -172615,7 +181408,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedance-2-0-fast-260128", @@ -172637,7 +181430,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z" + "last_updated": "2026-05-12T04:12:03Z" }, { "id": "doubao-seedream-4-0-250828", @@ -172653,7 +181446,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "imageGeneration" }, { @@ -172670,7 +181463,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "imageGeneration" }, { @@ -172691,7 +181484,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "imageGeneration" }, { @@ -172711,7 +181504,7 @@ "supported": false }, "attachment": true, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "imageGeneration" }, { @@ -172731,7 +181524,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172756,7 +181549,7 @@ "default": true }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172776,7 +181569,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172796,7 +181589,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172816,7 +181609,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172836,7 +181629,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" }, { @@ -172856,7 +181649,7 @@ "supported": false }, "attachment": false, - "last_updated": "2026-05-11T03:12:48Z", + "last_updated": "2026-05-12T04:12:03Z", "type": "chat" } ] @@ -174195,6 +182988,58 @@ }, "type": "chat" }, + { + "id": "qwen/qwen3.6-35b-a3b", + "name": "Qwen3.6-35B-A3B", + "display_name": "Qwen3.6-35B-A3B", + "limit": { + "context": 262144, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.6-plus", + "name": "Qwen3.6-Plus", + "display_name": "Qwen3.6-Plus", + "limit": { + "context": 1000000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, { "id": "xiaomimimo/mimo-v2-flash", "name": "XiaomiMiMo/MiMo-V2-Flash", @@ -174654,12 +183499,7 @@ }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "type": "chat" }, @@ -179381,6 +188221,37 @@ }, "type": "chat" }, + { + "id": "gpt-5.5-pro", + "name": "gpt-5.5-pro", + "display_name": "gpt-5.5-pro", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 1050000, + "output": 1050000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 30, + "output": 180, + "cache_read": 30 + }, + "type": "chat" + }, { "id": "deepseek-v4-flash", "name": "deepseek-v4-flash", @@ -180176,35 +189047,12 @@ "type": "imageGeneration" }, { - "id": "wan2.7-videoedit", - "name": "wan2.7-videoedit", - "display_name": "wan2.7-videoedit", - "modalities": { - "input": [ - "text", - "video" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 0 - }, - "type": "chat" - }, - { - "id": "wan2.7-t2v", - "name": "wan2.7-t2v", - "display_name": "wan2.7-t2v", + "id": "wan2.7-i2v", + "name": "wan2.7-i2v", + "display_name": "wan2.7-i2v", "modalities": { "input": [ + "image", "text" ] }, @@ -180223,9 +189071,9 @@ "type": "chat" }, { - "id": "wan2.7-r2v", - "name": "wan2.7-r2v", - "display_name": "wan2.7-r2v", + "id": "wan2.7-videoedit", + "name": "wan2.7-videoedit", + "display_name": "wan2.7-videoedit", "modalities": { "input": [ "text", @@ -180247,12 +189095,11 @@ "type": "chat" }, { - "id": "wan2.7-i2v", - "name": "wan2.7-i2v", - "display_name": "wan2.7-i2v", + "id": "wan2.7-t2v", + "name": "wan2.7-t2v", + "display_name": "wan2.7-t2v", "modalities": { "input": [ - "image", "text" ] }, @@ -180271,9 +189118,33 @@ "type": "chat" }, { - "id": "wan2.7-image", - "name": "wan2.7-image", - "display_name": "wan2.7-image", + "id": "wan2.7-r2v", + "name": "wan2.7-r2v", + "display_name": "wan2.7-r2v", + "modalities": { + "input": [ + "text", + "video" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2, + "output": 0 + }, + "type": "chat" + }, + { + "id": "wan2.7-image-pro", + "name": "wan2.7-image-pro", + "display_name": "wan2.7-image-pro", "modalities": { "input": [ "text", @@ -180296,9 +189167,9 @@ "type": "imageGeneration" }, { - "id": "wan2.7-image-pro", - "name": "wan2.7-image-pro", - "display_name": "wan2.7-image-pro", + "id": "wan2.7-image", + "name": "wan2.7-image", + "display_name": "wan2.7-image", "modalities": { "input": [ "text", @@ -181526,160 +190397,6 @@ }, "type": "chat" }, - { - "id": "tts-1", - "name": "tts-1", - "display_name": "tts-1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "cost": { - "input": 15, - "output": 15 - }, - "type": "tts" - }, - { - "id": "tts-1-hd", - "name": "tts-1-hd", - "display_name": "tts-1-hd", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "cost": { - "input": 30, - "output": 30 - }, - "type": "tts" - }, - { - "id": "gpt-4o-mini-tts", - "name": "gpt-4o-mini-tts", - "display_name": "gpt-4o-mini-tts", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "cost": { - "input": 0.48, - "output": 0.96 - }, - "type": "tts" - }, - { - "id": "gemini-2.5-flash-preview-tts", - "name": "gemini-2.5-flash-preview-tts", - "display_name": "gemini-2.5-flash-preview-tts", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", - "cost": { - "input": 0.5, - "output": 0.5, - "cache_read": 0 - }, - "type": "tts" - }, - { - "id": "gemini-2.5-pro-preview-tts", - "name": "gemini-2.5-pro-preview-tts", - "display_name": "gemini-2.5-pro-preview-tts", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", - "cost": { - "input": 0.5, - "output": 0.5, - "cache_read": 0 - }, - "type": "tts" - }, { "id": "doubao-seed-2-0-pro", "name": "doubao-seed-2-0-pro", @@ -182713,56 +191430,6 @@ }, "type": "chat" }, - { - "id": "web-gpt-image-2-vip", - "name": "web-gpt-image-2-vip", - "display_name": "web-gpt-image-2-vip", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 8, - "cache_read": 0 - }, - "type": "imageGeneration" - }, - { - "id": "web-gpt-image-2", - "name": "web-gpt-image-2", - "display_name": "web-gpt-image-2", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 8, - "cache_read": 0 - }, - "type": "imageGeneration" - }, { "id": "gpt-4.1-free", "name": "gpt-4.1-free", @@ -184265,31 +192932,6 @@ }, "type": "chat" }, - { - "id": "web-gpt-image-1.5", - "name": "web-gpt-image-1.5", - "display_name": "web-gpt-image-1.5", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 8, - "cache_read": 0 - }, - "type": "imageGeneration" - }, { "id": "gpt-5", "name": "gpt-5", @@ -184367,35 +193009,6 @@ }, "type": "chat" }, - { - "id": "deepseek-v3.2-speciale", - "name": "deepseek-v3.2-speciale", - "display_name": "deepseek-v3.2-speciale", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.58, - "output": 1.680028 - }, - "type": "chat" - }, { "id": "deepseek-v3.2-think", "name": "deepseek-v3.2-think", @@ -184426,36 +193039,6 @@ }, "type": "chat" }, - { - "id": "deepseek-math-v2", - "name": "deepseek-math-v2", - "display_name": "deepseek-math-v2", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 163000, - "output": 163000 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.492, - "output": 1.968, - "cache_read": 0.0984 - }, - "type": "chat" - }, { "id": "gpt-5-codex", "name": "gpt-5-codex", @@ -185660,25 +194243,6 @@ }, "type": "chat" }, - { - "id": "web-sora-2", - "name": "web-sora-2", - "display_name": "web-sora-2", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 2, - "cache_read": 2 - }, - "type": "chat" - }, { "id": "wan2.2-i2v-plus", "name": "wan2.2-i2v-plus", @@ -185773,25 +194337,6 @@ }, "type": "chat" }, - { - "id": "web-sora-2-pro", - "name": "web-sora-2-pro", - "display_name": "web-sora-2-pro", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 2, - "cache_read": 2 - }, - "type": "chat" - }, { "id": "kimi-for-coding-free", "name": "kimi-for-coding-free", @@ -186355,29 +194900,6 @@ }, "type": "chat" }, - { - "id": "DeepSeek-V3.1-Fast", - "name": "DeepSeek-V3.1-Fast", - "display_name": "DeepSeek-V3.1-Fast", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 163000, - "output": 163000 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "cost": { - "input": 1.096, - "output": 3.288 - }, - "type": "chat" - }, { "id": "claude-opus-4-0", "name": "claude-opus-4-0", @@ -187237,62 +195759,6 @@ }, "type": "chat" }, - { - "id": "grok-4-fast-non-reasoning", - "name": "grok-4-fast-non-reasoning", - "display_name": "grok-4-fast-non-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" - }, - { - "id": "grok-4-fast-reasoning", - "name": "grok-4-fast-reasoning", - "display_name": "grok-4-fast-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" - }, { "id": "kimi-k2-0711", "name": "kimi-k2-0711", @@ -187701,6 +196167,62 @@ }, "type": "chat" }, + { + "id": "grok-4-fast-non-reasoning", + "name": "grok-4-fast-non-reasoning", + "display_name": "grok-4-fast-non-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "grok-4-fast-reasoning", + "name": "grok-4-fast-reasoning", + "display_name": "grok-4-fast-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "type": "chat" + }, { "id": "DeepSeek-OCR", "name": "DeepSeek-OCR", @@ -187744,9 +196266,9 @@ "type": "chat" }, { - "id": "veo-3.1-fast-generate-preview", - "name": "veo-3.1-fast-generate-preview", - "display_name": "veo-3.1-fast-generate-preview", + "id": "veo-3.1-generate-preview", + "name": "veo-3.1-generate-preview", + "display_name": "veo-3.1-generate-preview", "modalities": { "input": [ "text", @@ -187764,14 +196286,15 @@ }, "cost": { "input": 2, - "output": 0 + "output": 2, + "cache_read": 0 }, "type": "chat" }, { - "id": "veo-3.1-generate-preview", - "name": "veo-3.1-generate-preview", - "display_name": "veo-3.1-generate-preview", + "id": "veo-3.1-fast-generate-preview", + "name": "veo-3.1-fast-generate-preview", + "display_name": "veo-3.1-fast-generate-preview", "modalities": { "input": [ "text", @@ -187789,8 +196312,7 @@ }, "cost": { "input": 2, - "output": 2, - "cache_read": 0 + "output": 0 }, "type": "chat" }, @@ -190795,31 +199317,6 @@ }, "type": "chat" }, - { - "id": "gpt-4o-image-vip", - "name": "gpt-4o-image-vip", - "display_name": "gpt-4o-image-vip", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 16, - "cache_read": 0 - }, - "type": "imageGeneration" - }, { "id": "Doubao-1.5-thinking-pro", "name": "Doubao-1.5-thinking-pro", @@ -190880,31 +199377,6 @@ }, "type": "chat" }, - { - "id": "gpt-4o-image", - "name": "gpt-4o-image", - "display_name": "gpt-4o-image", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 16, - "cache_read": 0 - }, - "type": "imageGeneration" - }, { "id": "gemma-3-1b-it", "name": "gemma-3-1b-it", @@ -191292,82 +199764,6 @@ }, "type": "chat" }, - { - "id": "ERNIE-X1.1-Preview", - "name": "ERNIE-X1.1-Preview", - "display_name": "ERNIE-X1.1-Preview", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 119000, - "output": 119000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.136, - "output": 0.544 - }, - "type": "chat" - }, - { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "cost": { - "input": 0.14, - "output": 0.56 - }, - "type": "chat" - }, - { - "id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "display_name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" - }, { "id": "minimax-m2", "name": "minimax-m2", @@ -191398,96 +199794,17 @@ "type": "chat" }, { - "id": "kat-dev", - "name": "kat-dev", - "display_name": "kat-dev", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.137, - "output": 0.548 - }, - "type": "chat" - }, - { - "id": "llama-3.3-70b", - "name": "llama-3.3-70b", - "display_name": "llama-3.3-70b", - "limit": { - "context": 65536, - "output": 65536 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.6, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "moonshotai/Kimi-Dev-72B", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.32, - "output": 1.28, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "moonshotai/Moonlight-16B-A3B-Instruct", - "name": "moonshotai/Moonlight-16B-A3B-Instruct", - "display_name": "moonshotai/Moonlight-16B-A3B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "nvidia-nemotron-3-super-120b-a12b", - "name": "nvidia-nemotron-3-super-120b-a12b", - "display_name": "nvidia-nemotron-3-super-120b-a12b", + "id": "ERNIE-X1.1-Preview", + "name": "ERNIE-X1.1-Preview", + "display_name": "ERNIE-X1.1-Preview", "modalities": { "input": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 119000, + "output": 119000 }, "tool_call": true, "reasoning": { @@ -191500,50 +199817,44 @@ } }, "cost": { - "input": 0.11, - "output": 0.55, - "cache_read": 0.0275 + "input": 0.136, + "output": 0.544 }, "type": "chat" }, { - "id": "o1-global", - "name": "o1-global", - "display_name": "o1-global", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.14, + "output": 0.56 }, "type": "chat" }, { - "id": "qianfan-qi-vl", - "name": "qianfan-qi-vl", - "display_name": "qianfan-qi-vl", + "id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", + "name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", + "display_name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", "limit": { "context": 8192, "output": 8192 @@ -191554,49 +199865,7 @@ }, "cost": { "input": 0.2, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "qwen2.5-vl-72b-instruct", - "name": "qwen2.5-vl-72b-instruct", - "display_name": "qwen2.5-vl-72b-instruct", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2.4, - "output": 7.2 - }, - "type": "chat" - }, - { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.14, - "output": 0.56 + "output": 0.8 }, "type": "chat" }, @@ -191855,9 +200124,69 @@ "type": "chat" }, { - "id": "unsloth/gemma-3-12b-it", - "name": "unsloth/gemma-3-12b-it", - "display_name": "unsloth/gemma-3-12b-it", + "id": "kat-dev", + "name": "kat-dev", + "display_name": "kat-dev", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.137, + "output": 0.548 + }, + "type": "chat" + }, + { + "id": "llama-3.3-70b", + "name": "llama-3.3-70b", + "display_name": "llama-3.3-70b", + "limit": { + "context": 65536, + "output": 65536 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.6, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "moonshotai/Kimi-Dev-72B", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.32, + "output": 1.28, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "moonshotai/Moonlight-16B-A3B-Instruct", + "name": "moonshotai/Moonlight-16B-A3B-Instruct", + "display_name": "moonshotai/Moonlight-16B-A3B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -191868,11 +200197,135 @@ }, "cost": { "input": 0.2, - "output": 0.8, + "output": 0.2, "cache_read": 0 }, "type": "chat" }, + { + "id": "nvidia-nemotron-3-super-120b-a12b", + "name": "nvidia-nemotron-3-super-120b-a12b", + "display_name": "nvidia-nemotron-3-super-120b-a12b", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 1000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 0.11, + "output": 0.55, + "cache_read": 0.0275 + }, + "type": "chat" + }, + { + "id": "o1-global", + "name": "o1-global", + "display_name": "o1-global", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + }, + "type": "chat" + }, + { + "id": "qianfan-qi-vl", + "name": "qianfan-qi-vl", + "display_name": "qianfan-qi-vl", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "qwen2.5-vl-72b-instruct", + "name": "qwen2.5-vl-72b-instruct", + "display_name": "qwen2.5-vl-72b-instruct", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2.4, + "output": 7.2 + }, + "type": "chat" + }, + { + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.14, + "output": 0.56 + }, + "type": "chat" + }, { "id": "qwen-qwq-32b", "name": "qwen-qwq-32b", @@ -191934,26 +200387,21 @@ "type": "chat" }, { - "id": "claude-3-5-haiku", - "name": "claude-3-5-haiku", - "display_name": "claude-3-5-haiku", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "unsloth/gemma-3-12b-it", + "name": "unsloth/gemma-3-12b-it", + "display_name": "unsloth/gemma-3-12b-it", "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1.1, - "output": 5.5 + "input": 0.2, + "output": 0.8, + "cache_read": 0 }, "type": "chat" }, @@ -191976,20 +200424,26 @@ "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "claude-3-5-haiku", + "name": "claude-3-5-haiku", + "display_name": "claude-3-5-haiku", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.1, + "output": 5.5 }, "type": "chat" }, @@ -192065,6 +200519,24 @@ }, "type": "rerank" }, + { + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" + }, { "id": "gemini-2.0-flash-lite-preview-02-05", "name": "gemini-2.0-flash-lite-preview-02-05", @@ -193757,68 +202229,6 @@ }, "type": "chat" }, - { - "id": "grok-4.20-beta-0309-non-reasoning", - "name": "grok-4.20-beta-0309-non-reasoning", - "display_name": "grok-4.20-beta-0309-non-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 - }, - "type": "chat" - }, - { - "id": "grok-4.20-beta-0309-reasoning", - "name": "grok-4.20-beta-0309-reasoning", - "display_name": "grok-4.20-beta-0309-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 - }, - "type": "chat" - }, { "id": "grok-4.20-multi-agent-beta-0309", "name": "grok-4.20-multi-agent-beta-0309", @@ -193988,6 +202398,68 @@ }, "type": "chat" }, + { + "id": "grok-4.20-beta-0309-non-reasoning", + "name": "grok-4.20-beta-0309-non-reasoning", + "display_name": "grok-4.20-beta-0309-non-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 2, + "output": 6, + "cache_read": 0.2 + }, + "type": "chat" + }, + { + "id": "grok-4.20-beta-0309-reasoning", + "name": "grok-4.20-beta-0309-reasoning", + "display_name": "grok-4.20-beta-0309-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 2, + "output": 6, + "cache_read": 0.2 + }, + "type": "chat" + }, { "id": "DESCRIBE", "name": "DESCRIBE", @@ -198709,6 +207181,60 @@ }, "type": "chat" }, + { + "id": "text-moderation-latest", + "name": "text-moderation-latest", + "display_name": "text-moderation-latest", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" + }, + { + "id": "text-moderation-stable", + "name": "text-moderation-stable", + "display_name": "text-moderation-stable", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" + }, + { + "id": "text-search-ada-doc-001", + "name": "text-search-ada-doc-001", + "display_name": "text-search-ada-doc-001", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 20, + "output": 20 + }, + "type": "chat" + }, { "id": "veo3", "name": "veo3", @@ -198737,12 +207263,15 @@ "type": "chat" }, { - "id": "tts-1-hd-1106", - "name": "tts-1-hd-1106", - "display_name": "tts-1-hd-1106", + "id": "veo-3", + "name": "veo-3", + "display_name": "veo-3", "modalities": { "input": [ - "audio" + "text", + "image", + "audio", + "video" ] }, "limit": { @@ -198754,9 +207283,11 @@ "supported": false }, "cost": { - "input": 30, - "output": 30 - } + "input": 2, + "output": 2, + "cache_read": 0 + }, + "type": "chat" }, { "id": "whisper-1", @@ -198828,9 +207359,9 @@ "type": "chat" }, { - "id": "tts-1-hd", - "name": "tts-1-hd", - "display_name": "tts-1-hd", + "id": "tts-1-hd-1106", + "name": "tts-1-hd-1106", + "display_name": "tts-1-hd-1106", "modalities": { "input": [ "audio" @@ -198850,9 +207381,9 @@ } }, { - "id": "tts-1-1106", - "name": "tts-1-1106", - "display_name": "tts-1-1106", + "id": "tts-1-hd", + "name": "tts-1-hd", + "display_name": "tts-1-hd", "modalities": { "input": [ "audio" @@ -198867,14 +207398,14 @@ "supported": false }, "cost": { - "input": 15, - "output": 15 + "input": 30, + "output": 30 } }, { - "id": "tts-1", - "name": "tts-1", - "display_name": "tts-1", + "id": "tts-1-1106", + "name": "tts-1-1106", + "display_name": "tts-1-1106", "modalities": { "input": [ "audio" @@ -198893,69 +207424,6 @@ "output": 15 } }, - { - "id": "veo-3", - "name": "veo-3", - "display_name": "veo-3", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2, - "output": 2, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "text-search-ada-doc-001", - "name": "text-search-ada-doc-001", - "display_name": "text-search-ada-doc-001", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 20, - "output": 20 - }, - "type": "chat" - }, - { - "id": "text-moderation-stable", - "name": "text-moderation-stable", - "display_name": "text-moderation-stable", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" - }, { "id": "yi-large", "name": "yi-large", @@ -199065,9 +207533,14 @@ "type": "chat" }, { - "id": "text-moderation-latest", - "name": "text-moderation-latest", - "display_name": "text-moderation-latest", + "id": "tts-1", + "name": "tts-1", + "display_name": "tts-1", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -199077,10 +207550,9 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 15, + "output": 15 + } }, { "id": "aistudio_gemini-2.0-flash", @@ -199765,8 +208237,8 @@ "display_name": "Anthropic: Claude Haiku 4.5", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" @@ -199781,6 +208253,7 @@ "supported": true, "default": true }, + "attachment": true, "type": "imageGeneration" }, { @@ -199906,6 +208379,7 @@ ] } }, + "attachment": true, "type": "imageGeneration" }, { @@ -199956,157 +208430,209 @@ ] } }, - "type": "imageGeneration" - }, - { - "id": "anthropic/claude-opus-4.7", - "name": "Anthropic: Claude Opus 4.7", - "display_name": "Anthropic: Claude Opus 4.7", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "interleaved": true, - "summaries": true, - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } - }, - "type": "imageGeneration" - }, - { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 64000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, "attachment": true, "type": "imageGeneration" }, - { - "id": "anthropic/claude-sonnet-4.5", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "type": "imageGeneration" - }, - { - "id": "anthropic/claude-sonnet-4.6", - "name": "Anthropic: Claude Sonnet 4.6", - "display_name": "Anthropic: Claude Sonnet 4.6", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." - ] - } - }, - "type": "imageGeneration" - }, + { + "id": "anthropic/claude-opus-4.7", + "name": "Anthropic: Claude Opus 4.7", + "display_name": "Anthropic: Claude Opus 4.7", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "anthropic/claude-opus-4.7-fast", + "name": "Anthropic: Claude Opus 4.7 (Fast)", + "display_name": "Anthropic: Claude Opus 4.7 (Fast)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "interleaved": true, + "summaries": true, + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 requires thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "anthropic/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "anthropic/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "anthropic/claude-sonnet-4.6", + "name": "Anthropic: Claude Sonnet 4.6", + "display_name": "Anthropic: Claude Sonnet 4.6", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path." + ] + } + }, + "attachment": true, + "type": "imageGeneration" + }, { "id": "arcee-ai/coder-large", "name": "Arcee AI: Coder Large", @@ -200432,9 +208958,9 @@ "type": "imageGeneration" }, { - "id": "baidu/qianfan-ocr-fast:free", - "name": "Baidu: Qianfan-OCR-Fast (free)", - "display_name": "Baidu: Qianfan-OCR-Fast (free)", + "id": "baidu/qianfan-ocr-fast", + "name": "Baidu: Qianfan-OCR-Fast", + "display_name": "Baidu: Qianfan-OCR-Fast", "modalities": { "input": [ "image", @@ -200995,11 +209521,6 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "type": "chat" }, { @@ -201015,8 +209536,8 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 1048575, + "output": 1048575 }, "tool_call": true, "reasoning": { @@ -201036,6 +209557,29 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v4-flash:free", + "name": "DeepSeek: DeepSeek V4 Flash (free)", + "display_name": "DeepSeek: DeepSeek V4 Flash (free)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 384000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "deepseek/deepseek-v4-pro", "name": "DeepSeek: DeepSeek V4 Pro", @@ -202115,9 +210659,9 @@ "type": "chat" }, { - "id": "inclusionai/ring-2.6-1t:free", - "name": "inclusionAI: Ring-2.6-1T (free)", - "display_name": "inclusionAI: Ring-2.6-1T (free)", + "id": "inclusionai/ring-2.6-1t", + "name": "inclusionAI: Ring-2.6-1T", + "display_name": "inclusionAI: Ring-2.6-1T", "modalities": { "input": [ "text" @@ -202907,6 +211451,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202930,6 +211475,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202953,6 +211499,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -202976,6 +211523,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203094,6 +211642,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203117,6 +211666,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203140,6 +211690,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203164,6 +211715,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { @@ -203188,6 +211740,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { @@ -203212,6 +211765,7 @@ "supported": true, "default": true }, + "attachment": true, "type": "imageGeneration" }, { @@ -203236,6 +211790,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { @@ -203282,6 +211837,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203400,6 +211956,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "chat" }, { @@ -203424,6 +211981,7 @@ "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { @@ -203447,7 +212005,8 @@ "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": true }, { "id": "moonshotai/kimi-k2", @@ -203576,8 +212135,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262142, + "output": 262142 }, "tool_call": true, "reasoning": { @@ -205564,6 +214123,11 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "type": "imageGeneration" }, @@ -206283,6 +214847,31 @@ }, "type": "chat" }, + { + "id": "perceptron/perceptron-mk1", + "name": "Perceptron: Perceptron Mk1", + "display_name": "Perceptron: Perceptron Mk1", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "type": "imageGeneration" + }, { "id": "perplexity/sonar", "name": "Perplexity: Sonar", @@ -206537,28 +215126,6 @@ }, "type": "chat" }, - { - "id": "qwen/qwen-max", - "name": "Qwen: Qwen-Max", - "display_name": "Qwen: Qwen-Max", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 8192 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "qwen/qwen-plus", "name": "Qwen: Qwen-Plus", @@ -206593,42 +215160,9 @@ "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28", - "name": "Qwen: Qwen Plus 0728", - "display_name": "Qwen: Qwen Plus 0728", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 32768 - }, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "type": "chat" - }, - { - "id": "qwen/qwen-plus-2025-07-28:thinking", - "name": "Qwen: Qwen Plus 0728 (thinking)", - "display_name": "Qwen: Qwen Plus 0728 (thinking)", + "id": "qwen/qwen-plus-2025-07-28", + "name": "Qwen: Qwen Plus 0728", + "display_name": "Qwen: Qwen Plus 0728", "modalities": { "input": [ "text" @@ -206642,29 +215176,6 @@ "output": 32768 }, "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, - { - "id": "qwen/qwen-turbo", - "name": "Qwen: Qwen-Turbo", - "display_name": "Qwen: Qwen-Turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "tool_call": true, "reasoning": { "supported": true }, @@ -206682,50 +215193,27 @@ "type": "chat" }, { - "id": "qwen/qwen-vl-max", - "name": "Qwen: Qwen VL Max", - "display_name": "Qwen: Qwen VL Max", + "id": "qwen/qwen-plus-2025-07-28:thinking", + "name": "Qwen: Qwen Plus 0728 (thinking)", + "display_name": "Qwen: Qwen Plus 0728 (thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1000000, "output": 32768 }, "tool_call": true, "reasoning": { - "supported": false - }, - "type": "imageGeneration" - }, - { - "id": "qwen/qwen-vl-plus", - "name": "Qwen: Qwen VL Plus", - "display_name": "Qwen: Qwen VL Plus", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { "id": "qwen/qwen2.5-vl-72b-instruct", @@ -208436,177 +216924,6 @@ }, "type": "chat" }, - { - "id": "x-ai/grok-3", - "name": "xAI: Grok 3", - "display_name": "xAI: Grok 3", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" - }, - { - "id": "x-ai/grok-3-beta", - "name": "xAI: Grok 3 Beta", - "display_name": "xAI: Grok 3 Beta", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" - }, - { - "id": "x-ai/grok-3-mini", - "name": "xAI: Grok 3 Mini", - "display_name": "xAI: Grok 3 Mini", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, - { - "id": "x-ai/grok-3-mini-beta", - "name": "xAI: Grok 3 Mini Beta", - "display_name": "xAI: Grok 3 Mini Beta", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "type": "imageGeneration" - }, - { - "id": "x-ai/grok-4-fast", - "name": "xAI: Grok 4 Fast", - "display_name": "xAI: Grok 4 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 30000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "type": "imageGeneration" - }, - { - "id": "x-ai/grok-4.1-fast", - "name": "xAI: Grok 4.1 Fast", - "display_name": "xAI: Grok 4.1 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 30000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "type": "imageGeneration" - }, { "id": "x-ai/grok-4.20", "name": "xAI: Grok 4.20", @@ -208686,34 +217003,6 @@ }, "type": "imageGeneration" }, - { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 10000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "type": "chat" - }, { "id": "xiaomi/mimo-v2-flash", "name": "Xiaomi: MiMo-V2-Flash", @@ -208972,8 +217261,8 @@ ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -209696,6 +217985,74 @@ }, "type": "chat" }, + { + "id": "deepseek/deepseek-v4-flash", + "name": "Deepseek V4 Flash", + "display_name": "Deepseek V4 Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 393216 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "deepseek/deepseek-v4-pro", + "name": "Deepseek V4 Pro", + "display_name": "Deepseek V4 Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 393216 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, { "id": "deepseek/deepseek-ocr-2", "name": "DeepSeek-OCR 2", @@ -210512,6 +218869,87 @@ }, "type": "chat" }, + { + "id": "zai-org/glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 202800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "type": "chat" + }, + { + "id": "zai-org/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "type": "chat" + }, + { + "id": "zai-org/glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "zai-org/glm-ocr", "name": "GLM-OCR", @@ -211548,6 +219986,30 @@ }, "type": "chat" }, + { + "id": "gpt-5.5-light", + "name": "gpt-5.5-light", + "display_name": "gpt-5.5-light", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "gpt-5.5-pro", "name": "gpt-5.5-pro", @@ -211570,6 +220032,11 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "type": "chat" }, { @@ -211967,6 +220434,28 @@ }, "type": "chat" }, + { + "id": "inclusionai/ling-2.6-flash", + "name": "Ling-2.6-flash", + "display_name": "Ling-2.6-flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, { "id": "meta-llama/llama-3.1-8b-instruct", "name": "Llama 3.1 8B Instruct", @@ -212158,6 +220647,102 @@ }, "type": "chat" }, + { + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax M2.5-highspeed", + "display_name": "MiniMax M2.5-highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131100 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "type": "chat" + }, + { + "id": "minimax/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131100 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax M2.7-highspeed", + "display_name": "MiniMax M2.7-highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, { "id": "mistralai/mistral-7b-instruct", "name": "Mistral 7B Instruct", @@ -212772,6 +221357,209 @@ }, "type": "chat" }, + { + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5-122B-A10B", + "display_name": "Qwen3.5-122B-A10B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65500 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5-27B", + "display_name": "Qwen3.5-27B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65500 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5-35B-A3B", + "display_name": "Qwen3.5-35B-A3B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65500 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-plus", + "name": "Qwen3.5-Plus", + "display_name": "Qwen3.5-Plus", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "type": "chat" + }, + { + "id": "inclusionai/ring-2.6-1t", + "name": "Ring-2.6-1T", + "display_name": "Ring-2.6-1T", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "sao10k/l3-8b-lunaris", "name": "Sao10k L3 8B Lunaris", @@ -212816,6 +221604,29 @@ "default": true }, "type": "chat" + }, + { + "id": "xiaomimimo/mimo-v2.5-pro", + "name": "XiaomiMiMo/MiMo-V2.5-Pro", + "display_name": "XiaomiMiMo/MiMo-V2.5-Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" } ] }, @@ -212848,7 +221659,6 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", "release_date": "2024-10-22", "last_updated": "2024-10-22", "cost": { @@ -212879,11 +221689,11 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-01-01", "release_date": "2025-10-15", "last_updated": "2025-10-15", "cost": { @@ -212901,7 +221711,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -212937,7 +221748,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -212972,8 +221784,8 @@ "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ - "pdf", "image", + "pdf", "text" ], "output": [ @@ -212992,9 +221804,8 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01-01", "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "last_updated": "2026-03-15", "cost": { "input": 5, "output": 25, @@ -213068,16 +221879,14 @@ "display_name": "Anthropic: Claude Opus 4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 409600, "output": 128000 }, "temperature": false, @@ -213116,10 +221925,9 @@ "release_date": "2026-04-16", "last_updated": "2026-04-16", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 4.5, + "output": 22.5, + "cache_read": 0.45 }, "type": "chat" }, @@ -213130,7 +221938,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -213165,15 +221974,16 @@ "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -213184,9 +221994,8 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "last_updated": "2026-03-15", "cost": { "input": 3, "output": 15, @@ -213570,8 +222379,9 @@ }, "limit": { "context": 163840, - "output": 163840 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -213588,6 +222398,16 @@ ] } }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "cost": { + "input": 0.7, + "output": 2.5, + "cache_read": 0.35 + }, "type": "chat" }, { @@ -213603,14 +222423,23 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 7168 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.15, + "output": 0.75 + }, "type": "chat" }, { @@ -213662,8 +222491,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -213707,8 +222536,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -213733,9 +222562,9 @@ "release_date": "2026-04-24", "last_updated": "2026-04-24", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 1.69, + "output": 3.38, + "cache_read": 0.13 }, "type": "chat" }, @@ -213761,14 +222590,13 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.03 + "input": 0.32, + "output": 0.89, + "cache_read": 0.15 }, "type": "chat" }, @@ -213785,8 +222613,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -213805,14 +222633,15 @@ ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "attachment": true, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "cost": { - "input": 0.29, - "output": 0.43 + "input": 0.435, + "output": 0.87, + "cache_read": 0.028 }, "type": "chat" }, @@ -213829,8 +222658,8 @@ ] }, "limit": { - "context": 163000, - "output": 64000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -213839,13 +222668,12 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", + "open_weights": true, "release_date": "2025-09-29", "last_updated": "2025-09-29", "cost": { - "input": 0.22, - "output": 0.33 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, @@ -213898,12 +222726,13 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { "input": 0.3, "output": 2.5, - "cache_read": 0.03 + "cache_read": 0.075, + "cache_write": 0.55 }, "type": "chat" }, @@ -213913,9 +222742,11 @@ "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ + "audio", "image", + "pdf", "text", - "audio" + "video" ], "output": [ "text" @@ -213952,16 +222783,15 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "release_date": "2025-06-17", + "last_updated": "2026-03-15", "cost": { "input": 0.1, "output": 0.4, - "cache_read": 0.03, - "cache_write": 1 + "cache_read": 0.01, + "cache_write": 0.083333 }, - "type": "imageGeneration" + "type": "chat" }, { "id": "google/gemini-2.5-pro", @@ -214016,7 +222846,8 @@ "cost": { "input": 1.25, "output": 10, - "cache_read": 0.125 + "cache_read": 0.31, + "cache_write": 2.375 }, "type": "chat" }, @@ -214077,10 +222908,11 @@ "display_name": "Google: Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text", + "audio", "image", - "video", - "audio" + "pdf", + "text", + "video" ], "output": [ "text" @@ -214090,7 +222922,7 @@ "context": 1048576, "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -214103,11 +222935,13 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-18", - "last_updated": "2026-02-18", + "release_date": "2026-05-07", + "last_updated": "2026-05-16", "cost": { "input": 0.25, - "output": 1.5 + "output": 1.5, + "cache_read": 0.025, + "cache_write": 0.08333 }, "type": "chat" }, @@ -214117,9 +222951,10 @@ "display_name": "Google: Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text", - "image", "audio", + "image", + "pdf", + "text", "video" ], "output": [ @@ -214127,13 +222962,14 @@ ] }, "limit": { - "context": 1050000, - "output": 65530 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -214142,8 +222978,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-03-20", - "last_updated": "2025-03-20", + "release_date": "2026-03-03", + "last_updated": "2026-03-15", "cost": { "input": 0.25, "output": 1.5 @@ -214156,11 +222992,11 @@ "display_name": "Google: Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text", - "image", - "video", "audio", - "pdf" + "image", + "pdf", + "text", + "video" ], "output": [ "text" @@ -214195,13 +223031,11 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "last_updated": "2026-03-15", "cost": { "input": 2, - "output": 12, - "cache_read": 0.2 + "output": 12 }, "type": "chat" }, @@ -214229,7 +223063,6 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-10", "release_date": "2025-03-13", "last_updated": "2025-03-13", "cost": { @@ -214313,75 +223146,13 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", - "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.016 - }, - "type": "chat" - }, - { - "id": "inclusionai/ling-flash-2.0", - "name": "inclusionAI: Ling-flash-2.0", - "display_name": "inclusionAI: Ling-flash-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" - }, - { - "id": "inclusionai/ling-mini-2.0", - "name": "inclusionAI: Ling-mini-2.0", - "display_name": "inclusionAI: Ling-mini-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, @@ -214453,52 +223224,8 @@ ] }, "limit": { - "context": 262000, - "output": 66000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-05-08", - "last_updated": "2026-05-08", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "inclusionai/ring-flash-2.0", - "name": "inclusionAI: Ring-flash-2.0", - "display_name": "inclusionAI: Ring-flash-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -214506,41 +223233,14 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "release_date": "2026-05-08", + "last_updated": "2026-05-16", "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" - }, - { - "id": "inclusionai/ring-mini-2.0", - "name": "inclusionAI: Ring-mini-2.0", - "display_name": "inclusionAI: Ring-mini-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "input": 0.075, + "output": 0.625, + "cache_read": 0.015 }, "type": "chat" }, @@ -214654,8 +223354,8 @@ ] }, "limit": { - "context": 204000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -214665,19 +223365,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", + "open_weights": true, "release_date": "2025-10-27", "last_updated": "2025-10-27", "cost": { "input": 0.3, "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.38 + "cache_read": 0.03 }, "type": "chat" }, @@ -214874,7 +223578,7 @@ }, "limit": { "context": 204800, - "output": 131070 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -214893,14 +223597,15 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.611, - "output": 2.4439 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, @@ -214980,14 +223685,13 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "output": 2.5 }, "type": "chat" }, @@ -215393,13 +224097,33 @@ "id": "openai/gpt-5-chat", "name": "OpenAI: GPT-5 Chat", "display_name": "OpenAI: GPT-5 Chat", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 272000, - "output": 16384 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10 }, "type": "chat" }, @@ -216000,6 +224724,8 @@ "display_name": "OpenAI: GPT-5.3 Chat", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -216008,18 +224734,16 @@ }, "limit": { "context": 128000, - "output": 16380 + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-03-04", + "last_updated": "2026-03-15", "cost": { "input": 1.75, "output": 14 @@ -216032,7 +224756,9 @@ "display_name": "OpenAI: GPT-5.3-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -216042,7 +224768,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -216072,11 +224798,12 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { "input": 1.75, - "output": 14 + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, @@ -216087,7 +224814,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -216143,6 +224871,8 @@ "display_name": "OpenAI: GPT-5.4 Mini", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -216153,7 +224883,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -216183,12 +224913,12 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { "input": 0.75, - "output": 4.5 + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, @@ -216198,6 +224928,8 @@ "display_name": "OpenAI: GPT-5.4 Nano", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -216208,7 +224940,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -216236,14 +224968,14 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { "input": 0.2, - "output": 1.25 + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, @@ -216254,7 +224986,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -216264,7 +224997,7 @@ "context": 1050000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -216293,11 +225026,12 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 45, - "output": 225 + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, @@ -216348,9 +225082,8 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { "input": 5, "output": 30, @@ -216382,11 +225115,15 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { "input": 30, "output": 180 @@ -216452,13 +225189,22 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 52429 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-01", + "cost": { + "input": 0.071, + "output": 0.1 + }, "type": "chat" }, { @@ -216474,8 +225220,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -216495,12 +225241,15 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0.11, + "output": 0.6, + "cache_read": 0.055, + "cache_write": 0.22 }, "type": "chat" }, @@ -216517,13 +225266,14 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -216537,12 +225287,13 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.06, + "output": 0.24, + "cache_read": 0.025 }, "type": "chat" }, @@ -216560,12 +225311,21 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 66536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0.3, + "output": 1.2 }, "type": "chat" }, @@ -216582,24 +225342,22 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.65, + "output": 3.25, + "cache_read": 0.2 }, "type": "chat" }, @@ -216616,8 +225374,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -216637,12 +225395,12 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 1.2, - "output": 6 + "input": 2.11, + "output": 8.45 }, "type": "chat" }, @@ -216733,7 +225491,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -216741,7 +225500,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -216760,14 +225519,14 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.8, - "output": 4.8 + "input": 0.115, + "output": 0.688 }, "type": "chat" }, @@ -216867,6 +225626,7 @@ "display_name": "Qwen: Qwen3.6-Plus", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -216875,7 +225635,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -216894,15 +225654,15 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "release_date": "2025-08-26", + "last_updated": "2026-04-11", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0.325, + "output": 1.95, + "cache_read": 0.0325, + "cache_write": 0.40625 }, "type": "chat" }, @@ -217012,21 +225772,22 @@ }, "limit": { "context": 256000, - "output": 64000 + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { "input": 0.1, - "output": 0.3 + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, @@ -217122,42 +225883,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", - "cost": { - "input": 0.172, - "output": 0.572, - "cache_read": 0.058, - "cache_write": 0 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -217165,152 +225892,14 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4-fast", - "name": "xAI: Grok 4 Fast", - "display_name": "xAI: Grok 4 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-20", - "last_updated": "2025-09-20", - "cost": { - "input": 0.2, - "output": 0.5 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4-fast-non-reasoning", - "name": "xAI: Grok 4 Fast None Reasoning", - "display_name": "xAI: Grok 4 Fast None Reasoning", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 30000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4.1-fast", - "name": "xAI: Grok 4.1 Fast", - "display_name": "xAI: Grok 4.1 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", - "cost": { - "input": 0.2, - "output": 0.5 - }, - "type": "chat" - }, - { - "id": "x-ai/grok-4.1-fast-non-reasoning", - "name": "xAI: Grok 4.1 Fast Non Reasoning", - "display_name": "xAI: Grok 4.1 Fast Non Reasoning", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2000000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2026-04-22", + "last_updated": "2026-05-16", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.066, + "output": 0.26, + "cache_read": 0.029 }, "type": "chat" }, @@ -217423,42 +226012,6 @@ }, "type": "chat" }, - { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 131072 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", - "cost": { - "input": 0.2, - "output": 1.5 - }, - "type": "chat" - }, { "id": "xiaomi/mimo-v2-flash", "name": "Xiaomi: MiMo-V2-Flash", @@ -217506,8 +226059,8 @@ ] }, "limit": { - "context": 265000, - "output": 265000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -217540,8 +226093,8 @@ ] }, "limit": { - "context": 1000000, - "output": 256000 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -217577,8 +226130,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -217623,7 +226176,7 @@ }, "limit": { "context": 1048576, - "output": 131072 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -217678,14 +226231,12 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "last_updated": "2026-03-15", "cost": { "input": 0.6, "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "cache_read": 0.175 }, "type": "chat" }, @@ -217713,14 +226264,12 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", "release_date": "2025-07-28", "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.13, + "output": 0.85, + "cache_read": 0.025 }, "type": "chat" }, @@ -217766,8 +226315,8 @@ "display_name": "Z.AI: GLM 4.6V", "modalities": { "input": [ - "text", "image", + "text", "video" ], "output": [ @@ -217775,8 +226324,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -217785,14 +226334,12 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": true, + "release_date": "2025-09-30", + "last_updated": "2026-01-10", "cost": { - "input": 0.14, - "output": 0.42, - "cache_read": 0.03 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, @@ -217881,8 +226428,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -217902,14 +226449,13 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "release_date": "2025-12-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.28, - "output": 1.14, - "cache_read": 0.06 + "input": 0.38, + "output": 1.98, + "cache_read": 0.2 }, "type": "chat" }, @@ -218009,8 +226555,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -218031,13 +226577,11 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.58, - "output": 2.6, - "cache_read": 0.14 + "input": 0.95, + "output": 3.15 }, "type": "chat" }, @@ -218054,8 +226598,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -218068,14 +226612,14 @@ "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-15", + "last_updated": "2026-04-11", "cost": { - "input": 0.88, - "output": 3.48 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, @@ -218092,7 +226636,7 @@ ] }, "limit": { - "context": 200000, + "context": 202752, "output": 131072 }, "temperature": true, @@ -218103,23 +226647,16 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-03", - "last_updated": "2026-04-03", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.8781, - "output": 3.5126, - "cache_read": 0.1903 + "input": 1.26, + "output": 3.96 }, "type": "chat" }, @@ -218129,18 +226666,17 @@ "display_name": "Z.AI: GLM 5V Turbo", "modalities": { "input": [ - "text", "image", - "video", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -218148,25 +226684,14 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": false, + "open_weights": true, "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "last_updated": "2026-04-11", "cost": { - "input": 0.726, - "output": 3.1946, - "cache_read": 0.1743 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" } diff --git a/src/renderer/settings/components/DeepChatAgentsSettings.vue b/src/renderer/settings/components/DeepChatAgentsSettings.vue index d282ce06e..9228442b9 100644 --- a/src/renderer/settings/components/DeepChatAgentsSettings.vue +++ b/src/renderer/settings/components/DeepChatAgentsSettings.vue @@ -1301,8 +1301,13 @@ const startCreate = () => { assignForm(emptyForm()) } const resetEditor = () => { - if (selectedAgentId.value === DRAFT_AGENT_ID) startCreate() - else selectAgent(selectedAgentId.value) + const agentId = selectedAgentId.value + if (!agentId || agentId === DRAFT_AGENT_ID) { + startCreate() + return + } + + selectAgent(agentId) } const saveAgent = async () => { if (!form.name.trim()) return diff --git a/src/renderer/settings/components/ProviderModelList.vue b/src/renderer/settings/components/ProviderModelList.vue index 3aa5f83b2..2be6bd096 100644 --- a/src/renderer/settings/components/ProviderModelList.vue +++ b/src/renderer/settings/components/ProviderModelList.vue @@ -713,13 +713,15 @@ type VirtualModelListItem = enableSearch: boolean typeValue: ModelType group: string - contextLength: number - maxTokens: number + contextLength: RENDERER_MODEL_META['contextLength'] + maxTokens: RENDERER_MODEL_META['maxTokens'] isCustom: boolean supportedEndpointTypes: RENDERER_MODEL_META['supportedEndpointTypes'] endpointType: RENDERER_MODEL_META['endpointType'] } +type VirtualModelItem = Extract + const getCachedVirtualItem = ( id: string, factory: () => TItem, @@ -772,7 +774,7 @@ const createProviderActionsItem = (providerId: string) => ) const createModelItem = (model: RENDERER_MODEL_META) => - getCachedVirtualItem( + getCachedVirtualItem( `${model.providerId}-${model.id}`, () => ({ id: `${model.providerId}-${model.id}`, @@ -923,9 +925,7 @@ const getBatchTargetModels = (providerId: string) => { return Array.from(dedupedModels.values()) } -const toRendererModel = ( - item: Extract -): RENDERER_MODEL_META => ({ +const toRendererModel = (item: VirtualModelItem): RENDERER_MODEL_META => ({ id: item.modelId, name: item.name, contextLength: item.contextLength, diff --git a/src/renderer/settings/components/RemoteSettings.vue b/src/renderer/settings/components/RemoteSettings.vue index 469900a14..ef2eec863 100644 --- a/src/renderer/settings/components/RemoteSettings.vue +++ b/src/renderer/settings/components/RemoteSettings.vue @@ -2340,16 +2340,27 @@ const syncWeixinIlinkFields = (snapshot: Partial | nu } } -const channelStatus = (channel: RemoteChannel) => - channel === 'telegram' - ? telegramStatus.value - : channel === 'feishu' - ? feishuStatus.value - : channel === 'qqbot' - ? qqbotStatus.value - : channel === 'discord' - ? discordStatus.value - : weixinIlinkStatus.value +function channelStatus(channel: 'telegram'): TelegramRemoteStatus | null +function channelStatus(channel: 'feishu'): FeishuRemoteStatus | null +function channelStatus(channel: 'qqbot'): QQBotRemoteStatus | null +function channelStatus(channel: 'discord'): DiscordRemoteStatus | null +function channelStatus(channel: 'weixin-ilink'): WeixinIlinkRemoteStatus | null +function channelStatus(channel: RemoteChannel): RemoteChannelStatus | null +function channelStatus(channel: RemoteChannel): RemoteChannelStatus | null { + if (channel === 'telegram') { + return telegramStatus.value + } + if (channel === 'feishu') { + return feishuStatus.value + } + if (channel === 'qqbot') { + return qqbotStatus.value + } + if (channel === 'discord') { + return discordStatus.value + } + return weixinIlinkStatus.value +} const getSnapshotPrincipalIds = ( channel: PairableRemoteChannel, @@ -3105,12 +3116,11 @@ const bindingKindClass = (kind: RemoteBindingSummary['kind']) => { } const formatOverviewLine = (channel: RemoteChannel) => { - const status = channelStatus(channel) - if (!status) { - return '' - } - if (channel === 'telegram') { + const status = channelStatus(channel) + if (!status) { + return '' + } return t('settings.remote.overview.telegram', { bindingCount: status.bindingCount, pairedCount: status.allowedUserCount @@ -3118,6 +3128,10 @@ const formatOverviewLine = (channel: RemoteChannel) => { } if (channel === 'qqbot') { + const status = channelStatus(channel) + if (!status) { + return '' + } return t('settings.remote.overview.qqbot', { bindingCount: status.bindingCount, pairedCount: status.pairedUserCount @@ -3125,6 +3139,10 @@ const formatOverviewLine = (channel: RemoteChannel) => { } if (channel === 'discord') { + const status = channelStatus(channel) + if (!status) { + return '' + } return t('settings.remote.overview.discord', { bindingCount: status.bindingCount, pairedCount: status.pairedChannelCount @@ -3132,6 +3150,10 @@ const formatOverviewLine = (channel: RemoteChannel) => { } if (channel === 'weixin-ilink') { + const status = channelStatus(channel) + if (!status) { + return '' + } return t('settings.remote.overview.weixinIlink', { bindingCount: status.bindingCount, accountCount: status.accountCount, @@ -3139,6 +3161,11 @@ const formatOverviewLine = (channel: RemoteChannel) => { }) } + const status = channelStatus('feishu') + if (!status) { + return '' + } + return t('settings.remote.overview.feishu', { bindingCount: status.bindingCount, pairedCount: status.pairedUserCount diff --git a/src/renderer/src/components/chat/AgentProgressFloat.vue b/src/renderer/src/components/chat/AgentProgressFloat.vue index 845b62a7f..804f929db 100644 --- a/src/renderer/src/components/chat/AgentProgressFloat.vue +++ b/src/renderer/src/components/chat/AgentProgressFloat.vue @@ -11,7 +11,7 @@ type="button" class="agent-progress-trigger group flex min-w-0 flex-1 items-center gap-2.5 rounded-2xl px-2 py-1.5 text-left transition-all duration-200 hover:bg-foreground/[0.035] focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-ring/50" data-testid="agent-progress-float-trigger" - :aria-expanded="String(!collapsed)" + :aria-expanded="!collapsed" :aria-label="t('chat.workspace.plan.section')" @click="emit('toggle-collapse')" > diff --git a/src/renderer/src/components/chat/ChatSearchBar.vue b/src/renderer/src/components/chat/ChatSearchBar.vue index 80f9e4b7b..b04372830 100644 --- a/src/renderer/src/components/chat/ChatSearchBar.vue +++ b/src/renderer/src/components/chat/ChatSearchBar.vue @@ -16,7 +16,7 @@ autocapitalize="off" autocomplete="off" spellcheck="false" - @update:model-value="emit('update:modelValue', $event)" + @update:model-value="handleModelValueUpdate" @keydown="handleKeydown" /> @@ -115,6 +115,10 @@ const selectInput = () => { element?.select() } +const handleModelValueUpdate = (value: string | number) => { + emit('update:modelValue', String(value)) +} + const handleKeydown = (event: KeyboardEvent) => { if (event.key === 'Escape') { event.preventDefault() diff --git a/src/renderer/src/components/chat/ChatStatusBar.vue b/src/renderer/src/components/chat/ChatStatusBar.vue index 7d479c971..77817d13a 100644 --- a/src/renderer/src/components/chat/ChatStatusBar.vue +++ b/src/renderer/src/components/chat/ChatStatusBar.vue @@ -993,6 +993,9 @@ type ModelSelection = { modelId: string } +type ReasoningEffortValue = NonNullable +type VerbosityValue = NonNullable + const isSameModelSelection = ( left: ModelSelection | null | undefined, right: ModelSelection | null | undefined @@ -1533,7 +1536,7 @@ const resolveCapabilityProviderIdForSelection = ( const getReasoningEffortOptions = ( portrait: ReasoningPortrait | null | undefined -): SessionGenerationSettings['reasoningEffort'][] => { +): ReasoningEffortValue[] => { if ( !portrait || portrait.mode === 'budget' || @@ -1556,14 +1559,12 @@ const getReasoningEffortOptions = ( : [portrait.effort] } -const getVerbosityOptions = ( - portrait: ReasoningPortrait | null | undefined -): SessionGenerationSettings['verbosity'][] => { +const getVerbosityOptions = (portrait: ReasoningPortrait | null | undefined): VerbosityValue[] => { const options = portrait?.verbosityOptions?.filter(isVerbosity) if (options && options.length > 0) { return options } - return isVerbosity(portrait?.verbosity) ? [...DEFAULT_VERBOSITY_OPTIONS] : [] + return isVerbosity(portrait?.verbosity) ? DEFAULT_VERBOSITY_OPTIONS.filter(isVerbosity) : [] } const getReasoningVisibilityOptions = ( diff --git a/src/renderer/src/components/chat/ChatToolInteractionOverlay.vue b/src/renderer/src/components/chat/ChatToolInteractionOverlay.vue index 90ef40913..62400d2e6 100644 --- a/src/renderer/src/components/chat/ChatToolInteractionOverlay.vue +++ b/src/renderer/src/components/chat/ChatToolInteractionOverlay.vue @@ -78,7 +78,8 @@ import { computed } from 'vue' import { useI18n } from 'vue-i18n' import { Button } from '@shadcn/components/ui/button' import { Icon } from '@iconify/vue' -import type { AssistantMessageBlock, ToolInteractionResponse } from '@shared/types/agent-interface' +import type { ToolInteractionResponse } from '@shared/types/agent-interface' +import type { DisplayAssistantMessageBlock } from '@/components/chat/messageListItems' type PendingInteractionView = { messageId: string @@ -86,7 +87,7 @@ type PendingInteractionView = { actionType: 'question_request' | 'tool_call_permission' toolName: string toolArgs: string - block: AssistantMessageBlock + block: DisplayAssistantMessageBlock } const props = defineProps<{ diff --git a/src/renderer/src/components/message/MessageBlockThink.vue b/src/renderer/src/components/message/MessageBlockThink.vue index d72213fae..77bb49cc6 100644 --- a/src/renderer/src/components/message/MessageBlockThink.vue +++ b/src/renderer/src/components/message/MessageBlockThink.vue @@ -38,10 +38,30 @@ const UPDATE_INTERVAL = 1000 const UPDATE_OFFSET = 80 let updateTimer: ReturnType | null = null +type ReasoningTimeRange = { + start: number + end: number +} + +const toReasoningTimeRange = ( + value: DisplayAssistantMessageBlock['reasoning_time'] +): ReasoningTimeRange | null => { + if (!value || typeof value !== 'object') { + return null + } + + return typeof value.start === 'number' && typeof value.end === 'number' + ? { start: value.start, end: value.end } + : null +} + +const reasoningTimeRange = computed(() => toReasoningTimeRange(props.block.reasoning_time)) + const reasoningDuration = computed(() => { let duration = 0 - if (props.block.reasoning_time) { - duration = (props.block.reasoning_time.end - props.block.reasoning_time.start) / 1000 + const range = reasoningTimeRange.value + if (range) { + duration = (range.end - range.start) / 1000 } else { duration = (props.usage.reasoning_end_time - props.usage.reasoning_start_time) / 1000 } @@ -69,7 +89,7 @@ const scheduleNextUpdate = () => { const fallbackDuration = Number.isFinite(reasoningDuration.value) ? reasoningDuration.value * 1000 : 0 - const startTimestamp = props.block.reasoning_time?.start ?? Date.now() - fallbackDuration + const startTimestamp = reasoningTimeRange.value?.start ?? Date.now() - fallbackDuration const now = Date.now() const elapsed = Math.max(0, now - startTimestamp) const remainder = elapsed % UPDATE_INTERVAL @@ -108,7 +128,7 @@ watch( ) const statusWatchSource = () => - [props.block.status, props.block.reasoning_time?.start, props.block.reasoning_time?.end] as const + [props.block.status, reasoningTimeRange.value?.start, reasoningTimeRange.value?.end] as const const handleStatusChange = useThrottleFn( () => { diff --git a/src/renderer/src/pages/ChatPage.vue b/src/renderer/src/pages/ChatPage.vue index b2b64c958..e384a3dbd 100644 --- a/src/renderer/src/pages/ChatPage.vue +++ b/src/renderer/src/pages/ChatPage.vue @@ -1001,7 +1001,7 @@ type PendingInteractionView = { actionType: 'question_request' | 'tool_call_permission' toolName: string toolArgs: string - block: AssistantMessageBlock + block: DisplayAssistantMessageBlock } type SubagentProgressPayload = { @@ -1011,7 +1011,7 @@ type SubagentProgressPayload = { type: 'permission' | 'question' messageId: string toolCallId: string - actionBlock: AssistantMessageBlock + actionBlock: DisplayAssistantMessageBlock } | null }> }